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FIG. 3 



□ specifier=address+( size/2)+(width /2) 
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depth = 4 bytes 



width = 16 bytel] J\ l5ize = depth I width = 64 bytel 



address is aligned to size (64 bytes), 
so low-order 6 bits are zero 



address \ aaaaaaoaaaaaaaaaaooaaoaaaaa aaaaaoaaaa | QQQQQQ J 
size/2 | OOOOOOOOOOOOOOOOOOOOOOOOOOooooooo | WOOOO] 
width/2 | OOOOOOOOOOOOOOOOOOOOOOOOOOooooooo \ 001 QQO | 



specifier 
500 



aaaaaaaaaaaaaaaaaaoaoaaaoaao aaaaaaaa a | J0100Q] 

^ " ' s — 

505 r-i^ r- 570 



FIG. 5 

specifier \oaaaaaaaaoaoaaaaoaaaoaaaoaa aoaaaaaaaa \ 101 000 \ ^ 610 



600 



605 



g75 N TinP(Q- s ) | 

urn/to/? | ooooooooooooooooooooooooooooooooo * I oo ioolk 

620 g ^ 5 ^ Hs end nof Aw/to/?;} 



aaaaaaaaaaaaaaaaaaaaoaoaaaa aaaaaaaaaa \ W QOQO] 



630 



gJ5 N f and '(0-t) | 
1 000000000000000000000000000000000 f 1 100000 I 

g * 5 ^ H f ^ not (size/2) I 
address \ aaaaaaaaaaaaaaoaaaoaaaaaa aaaaooaaaaaa | qqoqoq\ 

650 

FIG. 6 
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□ W777 c.c contents 



□ wmc.pa-physical address 
Owmc. size- size of contents 
\2wmc.cv-con tents valid 
Uwmc.th- thread last used 

□ wmc.reg-register last used 
Uwmc.rtv-register & thread valid 
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def data.flags <- AccessPhysicalLTB(pa,op,wdata) as 
th<-pa23..i9 
en pa6..4 

if (en < (1 || 0 LE )) and (th < T) and (paie..6=0) then 
case op of 
R: 

data <- 0 64 || LTBArray[th][en] 

W: 

LocalTB[ui][en] <- wdata63..o 

endcase 

else 

data <- 0 

end if 
enddef 

Fig. 16 
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def ga.LocalProtect <- LocalTranslationfth.ba.la.pl) as 
if LB & (ba63..48 © I363..48) then 

raise AccessDisallowedByVirtualAddress 

endif 

me <- NONE 

for i <- 0 to (1 |t 0 LE )-1 

if (I363..48 & ^LocalTB[th][G 6 3..4 8 ) = LocalTB[th][i] 47 ..3 2 then 
me <- i 

endif 
endfor 

if me = NONE then 

if ~ControlRegister p i+8 then 
raise LocalTBMiss 

endif 
ga <- la 

LocalProtect <- 0 

else 

ga <- (V363..48 A LocalTB[th][me]3i..i6) || va 4 7..o 
LocalProtect <- LocalTB[th][me]i5..o 

endif 
enddef 

Fig. 22 
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def data,flags <- AccessPhysicalGTB(pa,op,wdata) as 
th<-pa 2 3..19+GTl| 0 GT 
en<-pai8.4 

if (en < (1 || 0 G )) and (th < T) and (pai 8+GT ..i 9 = 0) then 
case op of 



R: 
W: 



data +- GTB Array [th 5 ..GT] [en] 
GTBArray[th5..GT][en] <- wdata 



else 



endcase 



data <- 0 



endif 



enddef 



Fig. 24 
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def pa.GlobalProtect <- GlobalAddressTranslation(th,ga f pl,lda) as 
me <- NONE 
fori<-0to(1 ||0 G )-1 

if GiobalTB[th 5 ..GT]['] * 0 then 

size «- (GlobalTB[th 5 ..GT][063.J and (0 64 -GlobalTB(th 5 .. G T][i]63..7)) II 0 8 
if ((ga63..8l|0 8 ) A (GlobalTB[th 5 ..GT]ti]63..8l!0 8 )) and (0 64 -size)) = 0 then 
me <- Globa!TB[th5..GT][0 

endif 

end if 
endfor 

if me = NONE then 
if Ida then 

PerformAccessDetail(AccessDetailRequiredByLocalTB) 

endif 

raise GlobaiTBMiss 

else 

pa <- (ga 6 3..8 A GlobalTB[th5..GT][me] 12 7.J2) II 937..0 

GlobalProtect *- GlobalTB[th 5 .. G T][me]7i..64 II 0 1 || GlobalTB[th 5 .. G T][me]6..o 

endif 
enddef 

Fig. 26 



def GTBUpdateWrite(th,fill t data) as 
me <- NONE 
fori ^0 to (1 || 0 G )-1 

size <- (GiobalTB[th 5 ..GT][i]63..7 and (0 64 -GlobaITB(th 5 .. G T][']63..7)) II 0 8 
if ((data 63 .. 8 ||0 8 ) A (GlobalTB[th 5 .. G T][063..8l|O 8 )) and (0 64 -size) = 0 then 
me <- i 

endif 
endfor 

if me = NONE then 
if fill then 

GlobalTB[th 5 ..GT][GTBLast[th 5 ..GT]] <- data 
GTBLast[th 5 ..GT] «- (GTBLast[th 5 „ G T] + 1)G-1..0 
if GTBLast[th 5 ..GT] = 0 then 

GTBLast[th 5 „GT] *- GTBFirst[th 5 .. G T] 

GTBBump[th5 # gt] «- 1 

endif 

endif 

else 

GlobalTB[th5. p GT][me] <- data 

endif 
enddef 

Fig. 27 
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def data.flags AccessPhysicalGTBRegisters(pa,op,wdata) as 
th*-pa 2 3..19+GTl|0 GT 
rn <- pai8..8 

if (rn < 5) and (th < T) and (pais+GT..19 = 0) and (P a 7..4 = °) then 
case rn || op of 
0|| R,1|| R: 

data <r- 0 
0 || W, 1 || W: 

GTBUpdateWrite(th,rno,wdata) 



2||R: 




data O 64 ' 6 || GTBLast[th 5 .. G T] 


2| 


|W: 




GTBLast[th5„GT] «- wdataQ-i..o 


3| 


I R: 




data <- O 64 ' 0 || GTBFirst[th 5 ..GT] 


3| 


| W: 




GTBFirst[th5 qt] *- wdataG-1 o 


3| 


|R: 




data *- 0 63 || GTBBump[th 5 ..GT] 


3| 


| W: 



GTBBump[th5 #> GT] <- wdatao 

endcase 

else 

data <- 0 

endif 
enddef 



Fig. 30 



I G. BOOLEAN | Group Boolean 

Equivalencies 



G.AAA 


Group three-way and 


G.AAA.1 


Group add add add bits 


G.AAS.1 


Group add add subtract bits 


G.ADD.1 


Group add bits 


G.AND 


Group and 


G.ANDN 


Group and not 


G.COPY 


Group copy 


G.N AAA 


Group three-way nand 


G.NAND 


Group nand 


G.NOOO 


Group three-way nor 


G.NOR 


Group nor 


G.NOT 


Group not 


G.NXXX 


Group three-way exclusive-nor 


G.000 


Group three-way or 


G.OR 


Group or 


G.ORN 


Group or not 


G.SAA.1 


Group subtract add add bits 


G.SAS.1 


Group subtract add subtract bits 


G.SET 


Group set 


G.SET.AND.E.1 


Group set and equal zero bits 


G.SET.AND.NE.1 


Group set and not equal zero bits 


G.SET.E.1 


Group set equal bits 


G.SET.G.1 


Group set greater signed bits 


G.SET. G.U.I 


Group set greater unsigned bits 


G.SET.G.Z.1 


Group set greater zero signed bits 


G.SET.GE.1 


Group set greater equal signed bits 


G.SET.GE.Z.1 


Group set greater equal zero signed bits 


G.SET.L1 


Group set less signed bits 


G.SET.LZ.1 


Group set less zero signed bits 


G.SET. LE.1 


Group set less equal signed bits 


G.SET.LE.U.1 


Group set less equal unsigned bits 


G.SET. LE.Z.1 


Group set less equal zero signed bits { 


G.SET.NE.1 


Group set not equal bits 


G.SET.GE.U.1 


Group set greater eaual unsigned bits 


G.SET.L.U.1 


Group set less unsigned bits 



Fig. 31A 



G.SSA.1 


Group subtract subtract add bits 


G.SSS.1 


Group subtract subtract subtract bits 


G.SUB.1 


Group subtract bits 


G.XNOR 


Group exclusive-nor 


G.XOR 


Group exclusive-or 


G.XXX 


Group three-way exclusive-or 


G.ZERO 


Group zero 




G.AAA rd@rc,rb 


<- G. BOOLEAN rd@rc,rb,0b1 0000000 


G.AAA.1 rd@rc,rb 


-> G.XXX rd@rc,rb 


G.AAS.f rd@rc,rb 


-» G.XXX rd@rc,rb 


G.ADD. 1 rd=rc,rb 


-»■ G.XOR rd=rc,rb 


G.AND rd=rc,rb 


«- G.BOOLEAN rd@rc,rb,0b1 0001 000 


G.ANDN rd-rc,rb 


<- G.BOOLEAN rd@rc,rb,0b01 000100 


G. BOOLEAN rd@rb,rc,i 


-> G.BOOLEAN rd@rc,rb,i7i5i6i4i3iii2'0 


G.COPYrd=rc 


<- G.BOOLEAN rd@rc,rc,0b1 0001 000 


G.NAAA. rd@rc,rb 


<- G.BOOLEAN rd@rc,rb,0b01 111111 


G.NAND rd=rc,rb 


<- G.BOOLEAN rd@rc,rb,0b01 1 101 1 1 


G.NOOO rd@rc,rb 


<- G.BOOLEAN rd@rc,rb,0b00000001 


G.NOR rd=rc,rb 


<- G.BOOLEAN rd@rc,rb,0b000 10001 


G.NOTrd=rc 


<- G.BOOLEAN rd@rc,rc,0b00010001 


G.NXXX rd@rc,rb 


<r- G.BOOLEAN rd@rc,rb,0b01 101 001 


G.000 rd@rc,rb 


<- G.BOOLEAN rd@rc,rb,0b1 11 11 110 


G.0Rrd=rc,rb 


<- G.BOOLEAN rd@rc,rb,0b1 1101110 


G.ORN rd=rc,rb 


<- G.BOOLEAN rd@rc,rb,0b1 101 11 01 | 


G.SAA.1 rd@rc,rb 


G.XXX rd@rc,rb 


G.SAS.1 rd@rc,rb 


-> G.XXX rd@rc,rb 


G.SETrd 


<- G.BOOLEAN rd@rd,rd,0b1 0000001 


G.SETAND.E.1 rd-rb,rc -» G.NAND rd=rc,rb 


G.SET.AND.NE.1 rd=rb,rc -+ G.AND rd=rc,rb 


G.SET.E.1 rd=rb,rc 


-> G.XNOR rd=rc,rb | 


G.SET.G.1 rd=rb,rc 


G.ANDN rd=rc,rb 


G.SET.G.U.1 rd=rb,rc 


-> G.ANDN rd=rb,rc 


G.SET.G.Z.1 rd=rc 


-» G.ZERO rd 


G.SET.GE.1 rd=rb,rc 


G.ORN rd=rc,rb 


G. SET. GE.Z. 1 rd=rc 


-» G.NOT rd=rc 


Fig. 31A (cont'd) 



G.SET.L1 rd=rb,rc 


-» 


G.ANDN rd=rb,rc 


G.SET.L.Z.1 rd=rc 


-> 


G.COPY rd=rc 


G.SET.LE. 1 rd=rb,rc 


-> 


CORN rd=rb,rc 


G.SET.LE.U.1 rd=rb,rc 


-> 


G.ORN rd=rc,rb 


G.SET.LE.Z.1 rd=rc 


-» 


G.SET rd 


G.SET.NE.1 rd=rb,rc 


-> 


G.XOR rd=rc ( rb 


G.SET.GE.U.1 rd=rb,rc 


-» 


G.ORN rd=rb,rc 


G. SET.L U. 1 rd=rb,rc 




G.ANDN rd=rc,rb 


G.SSA.1 rd@rc,rb 


-> 


G.XXX rd@rc,rb 


G.SSS.1 rd@rc.rb 


-> 


G.XXX rd@rc,rb | 


G.SUB.1 rd=rc,rb 


-> 


G.XOR rd=rc,rb 


G.XNOR rd=rc,rb 


<r- 


G.BOOLEAN rd@rc,rb,0b10011001 


G.XOR rd=rc,rb 


<r~ 


G.BOOLEAN rd@rc,rb,0b01100110 


G.XXX rd@rc,rb 


<r- 


G.BOOLEAN rd@rc,rb,0b10010110 


G.ZERO rd 


<- 


G.BOOLEAN rd@rd,rd,0b00000000 



Selection 



operation 


function (binary) 


function (decimal) 


d 


11110000 j 


240 


c 


11001100 


204 


b 


10101010 


176 | 


d&c&b 


10000000 


128 


(d&c)|b 


11101010 


234 


dlc|b 


11111110 


254 


d?c:b 


11001010 


202 


d^b 


10010110 


150 | 


-d^b 


01101001 


105 


0 


00000000 


0 



Fig. 31A (cont'd) 



Format 

G.BOOLEANrd@trc,trb,f 
rd=gbooleani(rd,rc,rb,f) 

31 252423 18 17 12 11 65 0 

[""cTboolean |ih| rd | rc | rb I il j 

7 1 6 6 6 6 

if f6=f5 then 

if f2=f 1 then 

if f2 then 

rc <- max(trc,trb) 
rb <- min(trc,trb) 

else 

rc <- min(trc,trb) 
rb <- max(trc,trb) 

endif 
ih<-0 

il<-0||f6||f7||f4||f3l|f0 

else 

if f2 then 

rc <- trb 
rb <- trc 

else 

rc <- trc 
rb <- trb 

endif 
ih«-0 

» <- 1 II II f7 II t* II II fb . 

endif 

else 

ih <— 1 
if f6 then 

rc<-trb 

rb <- trc 

H^fll|f2l|f7||f4||f3l|f0 

else 

rc <- trc 
rb<-trb 

il<-f2||fll|f7||f4l|f3l|f0 

endif 

endif 

Fig. 31B 



Definition 

def GroupBoolean (ih,rd,rc,rb f il) 
d <- RegRead(rd, 128) 
c <r- RegRead(rc, 128) 
b <- RegRead(rb, 128) 
if ih=0 then 

if il5=0 then 

f<-il 3 ||il 4 P4 II il2 II "I II (rc>rb)2||il 0 

else 

f<-il 3 P4 II "4 II 12 II "1 II 0 || 1 || ilo 

endif 

else 

f4-l3l|0||1||il2||Hi||il5||l4l|H0 

endif 

fori<-0to 127 by size 

ai<-f(dj||ci||bi) 
endfor 

RegWrite(rd, 128, a) 
enddef 



Exceptions 

none 



Fig. 31C 



Operati n cod s 



IG.MUX 


Group multiplex 


1 


Redundancies 


G.MUX ra=rd,rc,rc 


o 


G.COPYra=rc 


G.MUX ra=ra,rc,rb 


<=> 


G.BOOLEAN ra@rc,rb,0x1 1001010 


G.MUX ra=rd,ra,rb 


<=> 


G. BOOLEAN ra@rd,rb,0x1 1100010 


G.MUX ra=rd,rc,ra 


o 


G.BOOLEAN ra@rd,rc,0x1 101 1000 


G.MUX ra=rd,rd,rb 


o 


G.OR ra=rd,rb 


G.MUX ra=rd,rc,rd 


o 


G.AND ra=rd,rc 



Format 



G.MUX ra=rd,rc,rb 
ra=gmux(rd,rc,rb) 

31 24 23 18 17 12 11 6 5 0 

f G.MUX | rd | rc | rb | ra | 

8 6 6 6 6 

Fig.31D 



Definition 

def GroupTernaryCop.size.rd.rc.rb.ra) as 
d <- RegRead(rd, 128) 
c <- RegRead(rc, 128) 
b <- R6gRead(rb, 128) 
case op of 
G.MUX: 

a <- (c and d) or (b and not d) 

endcase 

RegWrite(ra, 128, a) 
enddef 

Exceptions 

none 

Fig. 31D 



G.ADD.8 


Group add bytes * 


G.ADD.16 


Group add doublets 


G.ADD.32 


Group add quadlets 


G.ADD.64 


Group add octlets 


G.ADD.128 


Group add hexlet 


G.ADD.L.8 


Group add limit signed bytes j 


G.ADD.L.16 


Group add limit signed doublets 


G.ADD.L.32 


Group add limit signed quadlets 


G.ADD.L64 


Group add limit signed octlets 


G.ADD.L128 


Group add limit signed hexlet 


G.ADD.L.U.8 


Group add limit unsigned bytes 


G.ADD.L.U.16 


Group add limit unsigned doublets 


G.ADD.L.U.32 


Group add limit unsigned quadlets 


G.ADD.L.U.64 


Group add limit unsigned octlets 


G.ADD.LU.128 


Group add limit unsigned hexlet 


G.ADD.8.0 


Group add signed bytes check overflow 


G.ADD.16.0 


Group add signed doublets check overflow 


G.ADD.32.0 


Group add signed quadlets check overflow 


G.ADD.64.0 


Group add signed octlets check overflow 


G.ADD.128.0 


Group add signed hexlet check overflow 


G.ADD.U.8.0 


Group add unsigned bytes check overflow 


G.ADD.U.16.0 


Group add unsigned doublets check overflow 


G.ADD.U.32.0 


Group add unsigned quadlets check overflow 


G.ADD.U.64.0 


Group add unsigned octlets check overflow 


G.ADD.U.128.0 


Group add unsigned hexlet check overflow 



Fig. 32A 



Format 



G.op.size rd=rc,rb 
rd=gopsize(rc,rb) 

31 24 23 18 17 12 11 6 5 0 

| G.size | rd | rc | rb | op 

8 6 6 6 6 



Fig. 32B 



Definition 



def Group(op ( size f rd,rc,rb) 
c <- RegRead(rc, 128) 
b <- RegRead(rb, 128) 
case op of 
G.ADD: 

for i <- 0 to 1 28-size by size 

ai+size-1J <- Ci+size-1..i + bi+size-1..i 
endfor 
G.ADD.L: 

for i <- 0 to 1 28-size by size 

t <- (Cj+size-1 II Ci+size-1..i) + (bi+size-1 II bi+size-1..i) 

ai+size-1..i «- (tsize * t size -i) ? (t S j 2e || tfjlg:}) ' t S ize-1..0 
endfor 
G.ADD.LU: 

for i <- 0 to 1 28-size by size 

t <- (0 1 || Ci + size-1..i) + (0 1 || bj+size-u) 

aj+size-U <- (tsize * 0) ? (1 slze ) : t S ize-1..0 
endfor 
G.ADD.O: 

for i <- 0 to 1 28-size by size 

t <- (Ci+size-1 II Cj+size-1..i) + (bj+size-1 II bj+ S ize-1 ..i) 

if t S jze * * S j ze -i then 

raise FixedPointArithmetic 

endif 

a i+size-1..i «- t s j ze -i..o 
endfor 
G.ADD.U.O: 

for i <- 0 to 1 28-size by size 

t«-<pi II c i+size-1..i) + (0 1 II b i+s »ze-1..i) 
if tsize * 0 then 

raise FixedPointArithmetic 

endif 

a i+size-1..i <- *size-1 ..0 
endfor 

endcase 

RegWrite(rd, 128, a) 
enddef 



Exceptions 

Fixed-point arithmetic 



Fig. 32C 



Operation codes 



Ci qpj AKin F ft 

u.OC 1 ./AINL/.C.O 


f^mnn cot and pnnal 7Prn hx/tpc 


H 9FT AND F 1fi 

U.OC I ./AINL/.C IU 


f^mnn cot and phiiaI 7Prn dmihlptc 


O.Ol I .nlNU.u.O^ 


firm in QPt and phi lal 7Prn ni isidlotc 

VJIUU|J dCl dl IU CV^Udl ^CIU VjUCiUlcld 


n ^FT AMD F fid 


f^rm in cot and pnual 7Prn nrtlptc 


QFT AMH F 19ft 
U.oC I .MINL/.C. IZO 


firAnn cot and pdi iq! Tarn Hovlot 


QFT AMn MP ft 


CXmi in. cot onH not oni ia\ 7orn K\/toc 


QPT AMn MF 1ft 
O.ut I .MINU.INC. ID 


uroup sei diiu noi equal zero oouoieis 


d QFT AMH MF ^9 
b.OC I .AINU. INC. oz 


/^tai m eoi onH not aai i *n 1 TAm ai 1 aW 1 A^r* 

uroup sei dnu noi equal zero quauieis 


r> OCT A MH MC ft>1 
u.OC 1 .AINU. INC. 04 


uroup set ana noi equal zero ocueis 


n OCT AMR MC iOQ 

u.oc 1 .AINU. INc. Izo 


uroup set ana noi equal zero nexiet 


r* OCT C Q 

u.oc 1 .c.o 


uroup sex equal oytes 


ri OCT C A ft 
U.OC 1 .C.l O 


firAi ir*\ cot Am 10I /4ai iKIa4p 

uroup sei equal oouoieis 


OCT C QO 

u.oc 1 .c.oz 


fZrnt 1 a eaf aai ia| a i ioHIaIco 

uroup sei equal quauieis 


O OCT C PA 

u.oc 1 .C.D4 


r2fAI I A Cftf AAI 1 a| AaI IaIp 

uroup sei equal ociieis 


^ OCT F lOft 
U.OC 1 .C. 1 Zo 


^pai m eot aai ia| hAvlot 

uroup sei equal nexiet 


Oct fSF ft 
U.OC 1 .uc.o 


"tai 1 a oot a ro ofor aai ia| cinnA^ h\\rf ao 

uroup sei greaier equal signeu uyxes 


CI OCT /^C 4ft 
U.OC 1 .uC. 1 D 


(2rAi in cot Offistor a a i ia| cinnfiH Hni iKIaIc 1 

uroup sei greater equal signeu uouuieis 


CX QFT fiF ^9 
U.OC I .UC.oZ 


rAi 1 a paJ nroator aai ia| cinnoH ai i a^I oto 

uroup sei greaier equal signeu quauieis 


n oct r*c ft/i 
u.oc 1 .UC.D4 


uroup sei greaier equal signed octiets 


n OCT PC HOQ 

u.oc 1 .uc.lzo 


uroup sei greater equal signed nexiei 


n oct nzz 1 1 p 

U.OC 1 .UC.U.O 


uroup sei greater equal unsigned oytes 


f> OCT HC M i ft 
U.OC 1 .UC.U.1D 


uroup set greater equal unsigned oouDiets 


OCT PC 1 1 QO 

u.oc 1 .bc.U.OZ 


uroup set greater equal unsigned quauieis 


OCT PC 1 1 ft /I 

u.oc 1 .UC.U.D4 


uroup set greater equal unsigned octiets 


n OCT PC 1 1 iOQ 

u.oc 1 .bt.U.lZo 


uroup set greater equal unsigned nexiet 


p OCT 1 ft 
u.oc 1 .L.o 


uroup set signed less oytes 


OCT 11ft i 
u.oc I .L. I D 


|_ 1 IA tf*AT PIAAAA lA*^**» | L^v 1 /-\ ^ 

uroup sei signed less oouoieis 


n OCT I QO 

u.oc I .L.oz 


uroup set signed less quaoiets 


n OCT I ft/! 

u.oc I .L.04 


uroup set signed less octiets 


p OCT I 10ft 

u.oc i .l.t zo 


uroup set signed less nexiet 


G SET L U 8 


Groun set less unsianed bvte«. 


G.SET.L.U.16 


Group set less unsigned doublets 


G.SET.L.U.32 


Group set less unsigned quadlets 


G.SET.L.U.64 


Group set less unsigned octiets 


G.SET.L.U.128 


Group set less unsigned hexlet 


G.SET.NE.8 


Group set not equal bytes 


G.SET.NE.16 


Group set not equal doublets 
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G.SET.NE.32 


Group set not equal quadlets 


G.SET.NE.64 


Group set not equal octlets 


G.SET.NE.128 


Group set not equal hexlet 


G.SUB.8 


Group subtract bytes 


G.SUB.8.0 


Group subtract signed bytes check overflow 


G.SUB.16 


Group subtract doublets 


G.SUB.16.0 


Group subtract signed doublets check overflow 


G.SUB.32 


Group subtract quadlets 


G.SUB.32.0 


Group subtract signed quadlets check overflow 


G.SUB.64 


Group subtract octlets 


G.SUB.64.0 


Group subtract signed octlets check overflow 


G.SUB.128 


Group subtract hexlet 


G.SUB.128.0 


Group subtract signed hexlet check overflow 


G.SUB.L8 


Group subtract limit signed bytes 


G.SUB.L.16 


Group subtract limit signed doublets 


G.SUB.L32 


Group subtract limit signed quadlets 


G.SUB.L64 


Group subtract limit signed octlets 


G.SUB.L128 


Group subtract limit signed hexlet 


G.SUB.L.U.8 


Group subtract limit unsigned bytes 


G.SUB.LU.16 


Group subtract limit unsigned doublets 


G.SUB.LU.32 


Group subtract limit unsigned quadlets 


G.SUB.LU.64 


Group subtract limit unsigned octlets 


G.SUB.LU.128 


Group subtract limit unsigned hexlet 


G.SUB.U.8.0 


Group subtract unsigned bytes check overflow 


G.SUB.U.16.0 


Group subtract unsigned doublets check overflow 


G.SUB.U.32.0 


Group subtract unsigned quadlets check overflow 


G.SUB.U.64.0 


Group subtract unsigned octlets check overflow 


G.SUB.U.128.0 


Group subtract unsigned hexlet check overflow 
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Equivalencies 



G SET EZ 8 


Group set equal zero bytes 


G SETEZ 16 


Group set equal zero doublets 


G SET EZ 32 


Group set equal zero quadlets 


G SET EZ 64 


Group set equal zero octlets 


G SETEZ 128 


Group set equal zero hexlet 


G SET GZ8 


Group set greater zero signed bytes 


G SET GZ 16 


Group set greater zero signed doublets 


G SET G Z 32 ' 


Group set greater zero signed quadlets 


G SET G Z 64 


Group set greater zero signed octlets 


G SET G 7 728 


Group set greater zero signed hexlet 


G SET GE Z 8 


Group set greater equal zero signed bytes 


G SPT GPZ Y6 


Group set greater equal zero signed doublets 


G SFT GP Z 32 


Group set greater equal zero signed quadlets 


G SET GE Z 64 


Group set greater equal zero signed octlets 


G SET GE 7 728 


Group set greater equal zero signed hexlet 


G SPT / 7 8 


Group set less zero signed bytes 


G SET L Z 16 


Group set less zero signed doublets 


G SPT LZ 32 


Group set less zero signed quadlets 


<^ 9PT / 7 84 


Group set less zero signed octlets 


G <ZFT 1 7 198 


Grouo set less zero sioned hexlet 


G 9PT / P 7 8 


Grouo set less eaual zero siqned bytes 


G <?PT/ P 7 76 

U.OL 1 .1—1 — 1 \J 


GrouD set less eaual zero siqned doublets 


G 9PT/ P 7 32 


Group set less equal zero signed quadlets 


G.SET.LE.Z.64 


Group set less equal zero signed octlets 


G.SET.LE.Z.128 


Group set less equal zero signed hexlet 


G.SET.NE.Z.8 


Group set not equal zero bytes 


G.SET.NE.Z.16 


Group set not equal zero doublets 


G.SET.NE.Z.32 


Group set not equal zero quadlets 


G.SET.NE.Z.64 


Group set not equal zero octlets 


G.SET.NE.Z.128 


Group set not equal zero hexlet 
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ocx / r o 

G.SET.LE.o 


/^rnnri cot Ipcc phiia! sinnpd hvtPS 
OiUUL/ ocl (woo c^Udi oiyi iou uy ico 


ocx i c Act 
G.ofc / .Lc. 7 0 


f^rmm spt Ipss pnual sinned doublets 


OCX I c oo 


f^rnun set Ipss pnual sinned ouadlets 


/-\ OCX 1 C fiyf 


f^rmin SPt Ipcc pnual cinnpd OCtletS 

Owl IwOO wlJUOl OIMI ivw W/llwW 


ocx / c -f op 
b.ot 1 .Ltz.l co 


Crnnn set Ipss pnual si aned hexlet 


OCX / £T / / 0 

b.ot /.Lc.U.o 


f^rnun set less eoual unsianed bvtes 

VlvUU Owl IwOw vUVIUI Ui iwiyi iwvj i/jvww 


/■> OCX / C / / 4 

b.ot /.Lfc.L/. 70 


f^rnnn spt less pnual unsianed doublets 

Ol vUU Owl IwOO vVJUQI Ul Iwiyi IwU uwwwiwiw 


OCX 1 C / f oo 


f^rmm set Ipss pnual unsianed ouedlets 

wl vUU Owl IwOO vUjUQI UllOiyilwW ^UUUIUM 


ocx / c / / 


f^rm in cpt Ipss pnual unsianed octlets 

wlUUU Owl IwOO wVJUCII Ul IwlMI Ivvl wwvlwlw 


OCX 1 C / / -f oo 

b.ot /.Lfc.L/. 1 co 


^rnnn spt Ipss pnual unsinned hexlet 

OIUUU Owl IwOO vVJUQI Ul lOiyi IwU MOAIvl 


G.ofc T.G.o 


f^rm m cot cinnoH nroator h\/tps 
oruup owl oiyiiwu yitscjitJi uyiwo 


G.ofc /.G. 76 


firm m cot cinnoH nroptor Hm ihlots 
oiuup owl oiyiiwU yicaiwf uuuuicio 


/"> OCX oo 

G.ofcT.G.o2 


^rnnn cot cinnoH nrpatpr m ipdlpts 
oruup owl oiyiiwU yicaid t^uauicio 


OCX o">< 

G.ofc 7.G. 64 


rirrw m cot cinnoH nroafpr of^tlots 
OlQUp Owl oiyiiwU yi ccalcl Uvllclo 


G. SET. G. 128 


^rfti in cot cinnoH nroator hoYlot 

oruuu owi oiyiiwu yitJaici iicaici 


(j.ot I.G.U.o 


f^mim cpt nrpatpr unsinnpd hvtps I 

OlUUp Owl yiwalwl UllOiyilwu wy ICO 


G.SET.G.U.16 


Group set greater unsigned doublets 


G.SET.G.U.32 


Group set greater unsigned quadlets 


G.SET.G.U.64 


Group set greater unsigned octlets 


G.SET.G.U.128 


Group set greater unsigned hexlet 




G.SET.E.Z.size rd=rc 


<- G.SET.AND.E.size rd=rc,rc 


G.SET.G.Z.size rd=rc 


<= G.SET.L.U.size rd=rc,rc 


G.SET.GE.Z.size rd=rc 


<= G.SET.GE.size rd=rc,rc 


G.SET.LZsize rd-rc 


<t= G.SET.L.size rd=rc,rc 


G.SET.LE.Z.size rd-rc 


<= G.SET.GE.U.size rd=rc,rc 


G.SET.NE.Zsize rd=rc 


<- G.SET.AND.NE.size rd=rc,rc j 


G.SET.G.size rd-rb,rc 


G.SET.L.size rd=rc,rb 


G.SET.G.U.size rd=rb,rc -> G.SET.L.U.size rd=rc,rb 


G.SET.LE.size rd=rb,rc 


-> G.SET.GE.size rd=rc,rb 


G.SET.LE.U.size rd=rb,rc -> G.SET.GE.U.size rd=rc,rb 
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Format 



G.op.size rd=rb,rc 
rd=gopsize(rb,rc) 

31 24 23 18 17 12 11 65 0 

\ G.size I rd I rc I rb | op 

8 6 6 6 6 



Fig. 33B 



D finition 

def GroupReversed(op,size,rd,rc t rb) 
c +- RegRead(rc, 128) 
b <- RegRead(rb, 128) 
case op of 
G.SUB: 

for i <r- 0 to 128-size by size 

ai+size-1..i «- bj+size-1 ..i - Ci +S i 2e -i.j 
endfor 
G.SUB.L: 

for i +- 0 to 128-size by size 

t <- (bj+size-1 II bj+size-1. .i) - (Cj+size-1 II Ci+size-1..i) 

aj+size-1..i <- (*size * t S j ze -i) ? (t S jze II t§g£l) : t S j ze -1.. 
endfor 
G.SUB.LU: 

for i <- 0 to 128-size by size 

t <- (0 1 || bj+size-u) - (0 1 || q+size-1..i) 

aj +S ize-1..i <- (tsize * 0) ? 0 size : W1..0 
endfor 
G.SUB.O: 

for i <- 0 to 128-size by size 

t <- (bj+size-1 II bj+size-1. .1) - (Cj+size-1 II Ci+size-1..i) 
if (tsize *tsize-l) then 

raise FixedPointArithmetic 

endif 

aj+size-1..i<-tsize-1..0 
endfor 
G.SUB.U.O: 

for i <- 0 to 128-size by size 

t <- (0 1 || bi +S i Z e-i j) - (0 1 || Ci +size -i..i) 
if (tsize * 0) then 

raise FixedPointArithmetic 

endif 

a i+size-1..i «- *size-1 -.0 
endfor 
G.SET.E: 

for i <- 0 to 128-size by size 

ai+size-1..i <- (bi+size-1..i = Cj+size-1..i) size 
endfor 
G.SET.NE: 

for i <r- 0 to 1 28-size by size 

aj+size-1..i «- (bj+size-1 ..i * Cj+ S j ze -i..j) s ' ze 
endfor 
G.SET.AND.E: 

for i +- 0 to 128-size by size 

aj+size-1..i <- ((bj+size-1 ..i and q+ S ize-1..i) = 0) size 
endfor 

Fig. 33C 



G.SET.AND.NE: 

for i +- 0 to 128-size by size 

aj+size-1 ..i «- ((t>i+size-1 ..i and Cj +S j ze -1 ..i) * 0) s,ze 
endfor 
G.SET.L: 

for i <r- 0 to 1 28-size by size 

aj+size-1. .i «- ((rc = rb) ? (b i+S j ze -i..i < 0) : (bj +S j ze -i..j < q +S j Z e-l..i)) size 
endfor 
G.SET.GE: 

for i <- 0 to 1 28-size by size 

aj+size-1. J <- ((re = rb) ? (bj +S j ze -l..i ^ 0) • (bj+size-1..i ^ Cj +S j ze .i..i)) size 
endfor 
G.SET.LU: 

for i <- 0 to 128-size by size 

aj+size-1. J «- ((re = rb) ? (bj+ S ize-1..i > 0) : 
((0 || b i+si2e .i..i)<(0 ||q +S ize-1..i))) sjze 

endfor 
G.SET.GE.U: 

for i <- 0 to 128-size by size 

aj+size-1 ..i <- ((re = rb) ? (bi +S j ze -i ..j <; 0) : 
((0 II b i+S ize-1..i) * (0 II c i+ si ze -l..i))) slze 

endfor 

endcase 

RegWrite(rd, 128, a) 
enddef 



Exceptions 

Fixed-point arithmetic 
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F DIV R4 

L..UI V .U*T 


Ensemble divide sianed octlets 


F DIV U 64 


Ensemble divide unsianed octlets 


F MUL 8 


Ensemble multiply signed bytes 


F MUL 16 


Ensemble multiply signed doublets 


F MUL 32 


Ensemble multiDlv sianed auadlets 


F MUL 64 

L_ . 1 VI \J Urn ■ V*T 


Ensemble multiDlv sianed octlets 


F Ml Jl 91 JM ft 

E—.IVI VJl_.OVJIVI.O 


Ensemble multinlv sum sianed bvtes 


F Ml II IM 1R 

CIVIVJL..OUIVI. IU 


Ensemble multinlv sum sianed doublets 


F Ml Jl JM 19 

L-.IVJ VJL.O UIVI.04. 


Ensemble multinlv sum sianed auadlets 


F Ml Jl <5l JM R4 

C.IVIVJL.OVJIVI .UH 


Fnsemhle multinlv sum sianed oetlpts 

lOvlMUIV IllUIUWiy Jul 1 1 Jl^l ICU vV/LlvlO 


p Mill c ft 

L».IVIVJL.V-r.O 


Fnspmhlp onmnlpx multinlv hvtps 

l_i ioci 1 1 uic wi i ipivA iiium^siy uy ico 


F Ml Jl P 1fi 

C. IVl VJl_. w. 1 U 


Fnspmblp romnlpx multinlv douhlpts 

Igvlliuiv wllipiCA 1 1 \\Jt\\.\yJ\j UUUUICIO 


F Mill H 19 


Ensemble comnlex multinlv auadlets 

bl Uwllll/lv wvlllUlw/V IllVJIUWiy VjUuUlvlw 


E MUL M 8 


Ensemble multinlv mixed-sianed bvtes 

uiiwvinwiw iiiuiiiwiy 1 1 iiavu wiyi ivu wyvwo 


F Ml Jl M 16 

^.IVI VJL..IVI. 1 \J 


Ensemble multiDlv mixed-sianed doublets 

Ullwwlllvlw 1 1 1 CI 1 11 \J 1 y 1 1 IIAwU wIMI Iwvl \J \J \J \J 1 w I w 


F MUI M 19 

I_. IVIVJL. IVl ,0£- 


Ensemble multinlv mixed-sianed auadlets 

Ul IwwIIIUIw IllvJIU^Ijf 1 1 H/\wU wIM' Iwvl vjUavllwlw 


F MUI M 64 


Ensemble multinlv mixed-sianed octlets 

L.I Iwvl 1 lUlw lllwllllL/ly 1 1 ll/\w\J wIMI IvU vvllwlw 


F MUL P ft 

L..IVIVJL..I .O 


Ensemble multinlv nolvnomial bvtes 

Imml lOvl 1 llta/IVr lllUIMUiy fJ\Jt J 1 IUI 1 IICII V/Jf IVW 


F Ml II P 16 


Fn^pmhlp multinlv nolvnomial douhlpte 

L-l loCI 1 IL/IC INUILipiy yJVJly 1 Iwl 1 IICII UUUL/ICIO 


F MUI P 19 

C IVl VJL.r.O^ 


Fnspmblp multinlv nolvnomial ouadlpts 

l_l loCI 1 IL/IC IllUUIpiy \J\J\y 1 IUI 1 IICII U,UC1UIClO 


F Mill P 64 

CIVIVJU.i .U*t 


Fn^pmhlp multinlv nolvnomial ortlpts 

L— i loci i iuic iiiuiuuiy yjyjiynsjuuQi uviicio 


F Ml Jl <>l JM C ft 

I VI VJU.OVJ IVl. V_/.0 


Fn^pmhlp multinlv sum oomnlpx bvtp^ 


F Ml II JM C 16 

C.IVIVJL.OVJIVI.V^. IU 


Fn^pmhlp multinlv sum oomnlpx douhlpts 


F Ml II JM P 19 

t- . I VI VJ L . O VJ I VI . V./ . O ^. 


Fn^pmhlp multinlv sum oomnlpx nuadlpte 

U.I IOCI 1 IL/IC IllUIUpiy OUIII wl lipiCA V^UClVJIdO 


F Ml Jl ^IIM M ft 

[_ . IVl VJ L. . O VJ I VI . I VI . o 


Fnsemhlp multinlv sum mixpri-sinnpri hvtps 

u.i ioci i iuiv 1 1 iui uyjiy oumi 1 1 iiavu oiui icu uyico 


F Ml II 9l JM M 16 

L_. IVIVJL. OVJ IVl. IVl. IU 


Fnspmhlp multinlv sum mixpri-sinnpd doublpts 

L.IIOCIIIUIC IllUIU^/iy OUIII 1 1 IIAvU OIUI ICU UUUUICIO 


F Ml Jl ^l JM M 19 

n. . 1 VI VJ L. . O VJ 1 VI . 1 VI . Ot. 


Fnsemhlp multinlv sum mixpd-sionpd nuadlpts 

l_IIOCIIIUIC IIIUILIUiy OUIII 1 1 IIACU OIUI ICU VfUCIUICiO 


F Ml Jl ^1 JM M 64 

l_. IVl VJL.OVJ IVl. IVl. VJ*t 


Fn^pmhlp multinlv Qiim mixpd-^innpd octlpts 

L.IIOCIIIUIC IIIUHIUiy OUIII 1 1 IIACU OIUI ICU vvllvlv 


F MUI QIIMIIR 

L- . IVl VJ I- . O VJ IVl . VJ . o 


Enspmblp multinlv sum unsionpd bvtes 

ui ioci i iwiw iiiuniuiy ouiii ui ioiui icu uyiww 


E MUL SUM U 16 


Ensemble multiply sum unsigned doublets 


E.MUL.SUM.U.32 


Ensemble multiply sum unsigned quadlets 


E.MUL.SUM.U.64 


Ensemble multiply sum unsigned octlets 


E.MULU.8 


Ensemble multiply unsigned bytes 


E.MUL.U.16 


Ensemble multiply unsigned doublets 


E.MULU.32 


Ensemble multiply unsigned quadlets 


E.MULU.64 


Ensemble multiply unsigned octlets 



Fig. 34A 



Format 

E.op.size rd=rc,rb 
rd=eopsize(rc,rb) 

31" 24 23 18 17 12 11 65 0 

I E.size I rd | rc | rb | op 

8 6 6 6 6 



Fig. 34B 



Definition 



def muKsize.h.vs.v.i.ws.wj) as 

mul <- ((vs&v si2e -1+i) h " si2e II vsize-1+i..i) * ((ws&w size -i + j) h " slze II w size -i+j.j) 
enddef 

def c PolyMultiply(size,a,b) as 

p[0]<-0 2 * size 
for k <- 0 to size-1 

p[k+1] <- p[k] * a k ? (0 size " k || b || 0 k ) : 0 2 * slze 

endfor 
c «- p[size] 
enddef 

def Ensemble(op,size,rd,rc,rb) 
c <- RegRead(rc, 128) 
b <- RegRead(rb, 128) 
case op of 

E.MUL, E.MUL.C:, EMULSUM, E.MULSUM.C. E.CON, E.CON.C. E.DIV: 

cs <- bs «- 1 
E.MULM:, EMUL.SUM.M, E.CON.M: 

cs<- 0 

bs<-1 

E.MULU:. EMULSUM.U. E.CON.U, E.DIV.U, E.MULP: 
cs 4- bs 4- 0 

endcase 
case op of 

E.MUL, E.MULU. E.MULM: 

for i <- 0 to 64-size by size 

^2*(i+size)-1..2*i «- mul(size.2*size,cs,c,i.bs,b,i) 

endfor 
E.MULP: 

for i <- 0 to 64-size by size 

d2*(i+size)-1..2*i «- PolyMultiply(size > c S j ze -i+i..i.b S i Z e-i+i.;i) 

endfor 
E.MULC: 

for i <- 0 to 64-size by size 
if (i and size) = 0 then 

p <- mul(size,2*size,1.c,i,1.b,i) - mul(size.2*size,1,c,i+size,1,b,i+size) 

else 

p «- mul(size,2*size,1,c.i,1,b.i+size) + mul(size,2*size,1,c.i,1,b.i+size) 

endif 

d2*(i+size)-1..2*i*-P 

endfor 

E.MULSUM, E.MULSUM.U. E.MULSUM.M: 
p[0]<-0 128 

for i <- 0 to 128-size by size 

pp+size] <- p[i] + mul(size,128,cs.c,i,bs,b,i) 

endfor 
• a*-p[128] 
E.MULSUM.C: 

p[0] <- 0 64 
p[size] <- 0 64 

for i <- 0 to <28-size by size 
if (i ano &ze) = 0 then 

pp-» 2* size] «- p[i] + mul(size,64,1 ,c,i,1 ,b,i) 

- mul(size,64,1 ,c,i+size,1 ,b.i+size) 



pp+2*size] <- p[i] + mut(size,64,1,c,i,1,b t i+size) 

+ multsize^.l.c.i+size.l.b.i) 

endif 

endfor 

a p[128+size] || p[128] 

Fig. 34C 



E.CON, E.CON.U, E.CON.M: 
p[0]<-0 128 

for j «- 0 to 64-size by size 

for i <r- 0 to 64-size by size 

pD+size]2*(j+ S ize)-1..2*i <~ PDl2*(i+size)-1..2*i + 
mu!(size t 2*size,cs,c,i + 64-j,bs,b,j) 

endfor 

endfor 
a <- p[64] 
E.CON.C: 

p[0]<-0 128 

for j <- 0 to 64-size by size 

for i <- 0 to 64-size by size 

if ((H) and j and size) = 0 then 

pD+size] 2 *(j+ S ize)-1..2*i *- PDl2*(i+size>-1..2*i 
mul(size,2*size,1,c,i+64-j,1 j) 



pD+size] 2 *(j+size)-1..2*i «- PDl2*(i+size>-1..2*i 
mui(size,2*size,1 I c t i+64-j+2*size,1,b,j) 

endif 

endfor 

endfor 
a<-p[64] 

E.DIV: 

if (b - 0) or ( (c = (1 1|0 63 )) and (b = 1 64 ) ) then 
a <- undefined 

else 

q<-c/b 

r <- c - q*b 

a «- r 63..0 II P63..0 

endif 
E.DIV.U: 

if b = 0then 

a 4- undefined 



q<-(0 || c)/(0 || b) 
r<-c-<0|| q)*(0 || b) 
a «- r 63..0 II Q63..0 

endif 

endcase 

RegWrite(rd, 128, a) 
enddef 



Exceptions 

none 



Fig. 34C (cont'd) 



G.C0M.AND.E.8 


oroup compare ana equal zero Dyies 


G.COM.AND.E.16 


oroup compare ana equal zero aouuieis 


G.COM.AND.E.32 


oroup compare ano equal zero quauieis 


G.COM.AND.E.64 


oroup compare ano equal zero ocuexs 


G.COM.AND.E.128 


oroup compare anu equal zero riexiei 


G.COM.AND.NE.o 


oroup compare anu nui t?quai z.&\v uyiuo 


G.C0M.AND.NE.16 


oroup compare ana noi equal zero aouoieis 


Am « a i in Kir o o 

G.COM.AND.NE.32 


oroup compare ana noi equal zero quauieis 


G.COM.AND.NE.64 


oroup compare ano noi equal zero ocueis 


G.COM.AND.NE.128 


m AAmAAPA An<J r% t 1 IaI "TATA hAvlAf 

oroup compare ana noi equal zero nexiei 


G.C0M.E.8 


Group compare equal bytes 


G.C0M.E.16 


Group compare equal doublets 


G.COM.E.32 


Group compare equal quadlets 


G.COM.E.64 


Group compare equal octlets 


G.COM.E.128 


Group compare equal hexlet 


G.C0M.GE.8 


Group compare greater equal signed bytes 


G.C0M.GE.16 


Group compare greater equal signed doublets 


G.COM.GE.32 


Group compare greater equal signed quadlets 


G.COM.GE.64 


Group compare greater equal signed octlets 


G.COM.GE.128 


Group compare greater equal signed hexlet 


G.C0M.GE.U.8 


Group compare greater equal unsigned bytes 


G.C0M.GE.U.16 


Group compare greater equal unsigned doublets 


/""\ ft ft ^> 1 ■ 

G.COM.GE.U.32 


Group compare greater equal unsigned quadlets 


G.COM.GE.U.64 


Group compare greater equal unsigned octlets 


G.COM.GE.U.128 


Group compare greater equal unsigned hexlet 


*-\ /~\ ft ft | o 

G.C0M.L.8 


Group compare signed less bytes 


G.C0M.L.16 


Group compare signed less doublets 


G.COM.L32 


Group compare signed less quadlets 


/"^ /*"\ ft ft ■ r% ft 

G.COM.L64 


Group compare signed less octlets 


ft ft ■ ^ <"*0 

G.COM.L.128 


Group compare signed less hexlet 


/""\/""\ft ft 1 1 1 o 

G.C0M.LU.8 


Group compare less unsigned bytes 


y"\ ft ft ■ ■ i 

G.C0M.L.U.16 


Group compare less unsigned doublets 


G.COM.LU.32 


Group compare less unsigned quadlets 


G.COM.L.U.64 


Group compare less unsigned octlets 


G.COM.L.U.128 
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oroup compare less unsigned nexiet 


vj.UUM.iNt.O 


oil/up lAJHipdiw nui Cw|uai uyi\?o 


G.C0M.NE.16 


Group compare not equal doublets 


G.COM.NE.32 


Group compare not equal quadlets 


G.COM.NE.64 


Group compare not equal octlets 


G.COM.NE.128 


Group compare not equal hexlet 



Fig. 35A 



Format 



G.COM.op.size rd.rc 
G.COM.opz.size red 

gcomopsize(rd,rc) 

31 24 23 18 17 12 11 65 0 

I G.size | rd | rc | op | GCOM | 

8 6 6 6 6 



Fig. 35B 



Definition 



def GroupCompare(op f size,rd t rc) 
d <- RegRead(rd, 128) 
c <- RegRead(rc, 128) 
case op of 

G.COM.E: 

for i <— 0 to 128-size by size 

aj+size-1..i <- (dj+size-1..i = Ci +S ize-1..i) sl2e 
endfor 
G.COM.NE: 

for i <- 0 to 128-size by size 

aj+size-1..i <- Wi+size-U * Cj+size-1..i) si2e 
endfor 
G.COM.AND.E: 

for i <- 0 to 128-size by size 

ai+size-1..i <- ((C|+size-1..i and dj +S ize-1 j) = 0) size 
endfor 
G.COM.AND.NE: 

for i <- 0 to 1 28-size by size 

aj+size-1..i <- ((Ci+ S ize-1..i and dj +S j Z e-1..i) * 0) size 
endfor 
G.COM.L: 

for i <- 0 to 128-size by size 

aj+size-1..i <- ((I'd = rc) ? (c i+S jze-1..i < 0) : (dj +S jze-1..i < Cj +S ize-1..i)) slze 
endfor 
G.COM.GE: 

for i <- 0 to 1 28-size by size 

aj+size-1 J «- ((rd = rc) ? (c i+S ize-1 .J * 0) : (d i+S jze-1 J * c i+si ze-i ..i)) size 
endfor 
G.COM.LU: 

for i <- 0 to 128-size by size 

ai+size-1J <- ((rd = rc) ? (q+ S ize-1..i > 0) : 
((0 || d +S ize-1..i)<(0 ||q +S ize-1..i))) size 

endfor 
G.COM.GE.U: 

for i «- 0 to 128-size by size 

aj +S i Z e-i j <- ((rd = rc) ? (q+ S ize-1 ..i * 0) : 
((0 || df+size-u) * (0 || c l+S ize-1..i))) si2e 

endfor 

endcase 
if (a * 0) then 

raise FixedPointArithmetic 

end if 
encidef 



Exceptions 

Fixed-point arithmetic 
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E LOG MOST 8 


Ensemble log of most significant bit signed bytes 


E LOG MOST 16 


Ensemble log of most significant bit signed doublets 


E LOG MOST 32 


Ensemble log of most significant bit signed quadlets 


E LOG MOST 64 


Ensemble log of most significant bit signed octlets 


E LOG MOST 128 


Ensemble loa of most sianificant bit sianed hexlet 


E LOG MOST U 8 


Ensemble loa of most sianificant bit unsianed bvtes I 


E LOG MOST U 16 


Ensemble loa of most sianificant bit unsianed doublets 


E LOG MOST U 32 


Ensemble loa of most sianificant bit unsianed auadlets 


E LOG MOST U 64 


Ensemble loa of most sianificant bit unsianed ortlets 


E LOG MOST U 128 


Ensemble Ion of most sianificant hit tinsinneri heylet 


E SUM 8 


Ensemble sum sinned hvtes 

^IIOCIIik/lv OUI 1 1 vIMI IwU U j ICO 


E SUM 16 


Ensemble sum sinned doublets 

Uil IUVI 1 lUlw wUIII vlUI IwU UVUUlUlw 


E.SUM.32 


Ensemble sum signed quadlets 


E.SUM.64 


Ensemble sum signed octlets 


E.SUM.U.1 


Ensemble sum unsigned bits 


E.SUM.U.8 


Ensemble sum unsigned bytes 


E.SUM.U.16 


Ensemble sum unsigned doublets 


E.SUM.U.32 


Ensemble sum unsigned quadlets 


E.SUM.U.64 


Ensemble sum unsigned octlets 



Selection 



class 


op 


size 


sum 


SUM 


8 16 32 64 


SUM.U 


1 8 16 32 64 


log most 
significant bit 


LOG.MOST LOG.MOST.U 


8 16 32 64 128 



Fig. 36A 



Format 

E.op.size rd=rc 
rd=eopsize(rc) 

31 24 23 18 17 12 11 6 5 0 

I E.size | rd | rc | op | E.UNARY | 

8 6 6 6 6 



Fig. 36B 



Definition 



def EnsembleUnary(op,size,rd f rc) 
c<- RegRead(rc f 128) 
case op of 

E.LOG.MOST: 

for i <- 0 to 128-size by size 
if (Cj+size-1..i=0)then 

a i+size-1..i <- -1 

else 

for j 4-0 to size-1 

if Csize-1+i..j+i = (cfiiil^i || not c size _ 1+l ) then 
a i+size-1..i<*-j 

endif 
endfor 

endif 
endfor 
E.LOG.MOSTU: 

for i <- 0 to 1 28-size by size 
if (cj+size-L.i^OJthen 
a i+size-1..i *- "1 

else 

forj<-0to size-1 

if Csize-1+i..j+i = (0 sjze - 1 -j || 1) then 
a i+size-1..i<-j 

endif 
endfor 

endif 
endfor 
E.SUM: 

p[0]<-0 128 

for i <- 0 to 128-size by size 

p[i+size] <- p[i] + (c^ije || c S j Z e-1+Li) 
endfor 
a<-p[128] 
E.SUMU: 

p[0] <- 0 128 

for i <- 0 to 128-size by size 

p[i+size] <- p[i] + (0128-size |, Csjze -1 +U ) 
endfor 
a«-p[128] 

endcase 

RegWrite(rd, 128,a) 
enddef 

Exceptions 

none 



Fig. 36C 



Floating-point function Definitions 

def eb <- ebits(prec) as 
case pref of 



16: 






eb <- 5 


32: 






eb<-8 


64: 






eb<- 11 


128: 






eb«- 15 



endcase 
enddef 

def eb <- ebias(prec) as 

eb 0 || iebits(prec)-1 
enddef 

def fb 4- fbits(prec) as 

fb <~ prec - 1 - eb 
enddef 

def a <r- F(prec, ai) as 
a.s +- aip r ec-1 
ae 4- ai prec -2..fbits(prec) 

af<-aifbits(prec)-1..0 
ifae=1 ebite (P rec )then 
if af = 0 then 

a.t <- INFINITY 
elseif affbits(prec)-1 *hen 
a.t <- SNaN 
a.e <- -fbits(prec) 
a.f<-1||affbits(prec)-2..0 

else 

a.t <- QNaN 
a.e «- -fbits(prec) 
a.f <- af 

endif 

Fig. 37 



etseif ae = 0 then 
if af = 0 then 

a.t <- ZERO 

else 

a.t <- NORM 

a.e<- 1-ebias(prec)-fbits(prec) 
a.f ^- 0 || af 

endif 

else 

a.t *- NORM 

a.e ae-ebias(prec)-fbits(prec) 
a.f <- 1 || af 

endif 
enddef 

def a *- DEFAULTQNAN as 

a.s<-0 

a.t <- QNAN 

a.e <- -1 

a.f<-1 
enddef 

def a <- DEFAULTSNAN as 

a.s<-0 

a.t <r- SNAN 

a.e <--1 

a.f<-1 
enddef 

def fadd(a.b) as faddr(a.b.N) enddef 

def c faddr(a,b,round) as 

if a.t=NORM and b.t=NORM then 

// d,e are a,b with exponent aligned and fraction adjusted 
if a.e > b.e then 
d «- a 
e.t <- b.t 
e.s <- b.s 
e.e «- a.e 

e.f<-b.f||O ae " be 
else if a.e < b.e then 
d.t <- a.t 
d.s <- a.s 
d.e <- b.e 
d.f<-a.f || o b - e " a - e 
e<- b 

endif 
c.t <- d.t 
c.e <- d.e 
if d.s = e.s then 

c.s *- d.s 

c.f <- d.f + e.f 
elseif d.f > e.f then 

c.s «- d.s 

c.f <- d.f -e.f 



Fig. 37 (cont'd) 



elseif d.f < e.f then 
c.s «- e.s 
c.f e.f- d.f 

else 

c.s «- r=F 
at <- ZERO 

endif 

// priority is given to b operand for NaN propagation 
elseif (b.t=SNAN) or (b.t=QNAN) then 
c <- b 

elseif (a.t=SNAN) or (a.t=QNAN) then 
C4-a 

elseif a.t=ZERO and b.t=ZERO then 
at <- ZERO 

c.s <- (a.s and b.s) or (round=F and (a.s or b.s)) 
// NULL values are like zero, but do not combine with ZERO to alter sign 
elseif a.t=ZERO or a.t=NULL then 

c <- b 

elseif b.t=ZERO or b.t=NULL then 

q 4 g 

elseif a.t=INFINITY and b.t=INFINITY then 
if a.s * b.s then 

c <- DEFAULTSNAN // Invalid 

else 

c <- a 

endif 

elseif a.t=INFINITY then 

q 4 g 

elseif b.t=INFINITY then 
c <- b 

else 

assert FALSE // should have covered al the cases above 

endif 
enddef 



def b <- fneg(a) as 
b.s <~ -a.s 
b.t<-a.t 
b.e <- a.e 
b.f<-a.f 

enddef 



def fsub(a.b) as fsubr(a,b,N) enddef 

def fsubr(a,b,round) as faddr(a,fneg(b),round) enddef 

def frsub(a.b) as frsubr(a,b,N) enddef 

def frsubr(a,b,round) as faddr(fneg(a),b f round) enddef 

def c <- fcom(a,b) as 

if (a.t=SNAN) or (a.t=QNAi i) or (b.t=SNAN) or (b.t=QNAN) then 
c<-U 

elseif a.t=INFINITY and b.t=INFINITY then 
if a.s * b.s then 

c <r- (a.s=0) ? G: L 



Fig. 37 (cont'd) 



else 

c«-E 

endif 

elseifa.t=INFINITYthen 

c <- (a.s=0) ? G: L 
elseif b.t=INFINITY then 

c«-(b.s=0)?G:L 
elseif a.t=NORM and b.t=NORM then 

if a.s * b.s then 

c <- (a.s=0) ? G: L 

else 

if a.e > b.e then 
af <- a.f 

bf<-b.f ||(>a.e-b.e 

else 

af ^- a.f || o be " ae 
bf<-b.f 

endif 

ifaf = bfthen 
c<-E 

else 

c«-((a.s=0) A (af>bf))?G:L 

endif 

endif 

elseif a.t=NORM then 

c <- (a.s=0) ? G: L 
elseif b.t=NORM then 

c <- (b.s=0) ? G: L 
elseif a.t=ZERO and b.t=ZERO then 

c<- E 

else 

assert FALSE // should have covered al the cases above 

endif 
enddef 



def c <- fmul(a,b) as 

if a.t=NORM and b.t=NORM then 

c.s <- a.s A b.s 

c.t <- NORM 

c.e <- a.e + b.e 

c.f<-a.f*b.f 
// priority is given to b operand for NaN propagation 
elseif (b.t=SNAN) or (b.t=QNAN) then 

c.s «- a.s A b.s 

c.t<-b.t 

c.e <- b.e 

c.f<-b.f 

elseif (a.t=SNAN) or (a.t=QNAN) then 
c.s <- a.s A b.s 
at <- a.t 
c.e <- a.e 
c.f *- a.f 

elseif a.t=2ERO and b.t=INFINITY then 

c <- DEFAULTSNAN // Invalid 
elseif a.t=INFINITY and b.t=ZERO then 

c <- DEFAULTSNAN // Invalid 



Fig. 37 (cont'd) 



elseif a.t=ZERO or b.t=ZERO then 
c.s <- a.s A b.s 
c.t <- ZERO 

else 

assert FALSE // should have covered al the cases above 

endif 
enddef 

def c <- fdivr(a.b) as 

if a.t=NORM and b.t=NORM then 
c.s <- a.s A b.s 
c.t <- NORM 
c.e <- a.e - b.e + 256 

c.f<-(a.f II 0 256 )/b.f 
// priority is given to b operand for NaN propagation 
elseif (b.t=SNAN) or (b.t=QNAN) then 

c.s <- a.s A b.s 

c.t <- b.t 

c.e <- b.e 

c.f<-b.f 

elseif (a.t=SNAN) or (a.t=QNAN) then 
c.s <- a.s A b.s 
c.t<-a.t 
c.e <- a.e 
c.f <- a.f 

elseif a.t=ZERO and b.t=ZERO then 

c <- DEFAULTSNAN // Invalid 
elseif a.t=INFINITY and b.t=INFINITY then 

c <- DEFAULTSNAN // Invalid 
elseif a.t=ZERO then 

c.s <r- a.s A b.s 

c.t <- ZERO 
elseif a.t=INFINITY then 

c.s <- a.s A b.s 

c.t <- INFINITY 

else 

assert FALSE // should have covered al the cases above 

endif 
enddef 

def msb <- findmsb(a) as 

MAXF 2 18 // Largest possible f value after matrix multiply 
forj<-OtoMAXF 

if 3MAXF-1 ..j = (OMAX' 1 - 1 "] || 1) then 
msb «-j 

endif 
endfor 
enddef 



def ai <- PackF(prec,a,round) as 
case a.t of 
NORM: 

msb <- findmsb(a.f) 

m msb-l-fbits(prec) // Isb for normal 

rdn <- -ebias(prec)-a.e-1-fbits(prec) // Isb if a denormal 

rb (m > rdn) ? m : rdn 
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if rb ^ 0 then 

aifr<-a.f ms b-i..o II 0-* 
eadj <- 0 

else 

case round of 
C: 

s <- o™d>fo || (-a.s)' 5 

F: 

s <- 0™$b-rt> || (a.s)* 
N, NONE: 

s<-O msb -*||~a.frbl|a.ffr 1 

X: 

if a.frb-L.o^Othen 

raise FloatingPointArithmetic // Inexact 

endif 
s <- 0 

Z: 

s<-0 

endcase 

v^-(0||a.f msb .. 0 ) + (0||s) 
ifv msb = 1 then 

aifr^-v ms b-i..rb 

eadj <- 0 

else 

aifr^-O^P^) 
eadj <- 1 

endif 

endif 

aien <- a.e + msb - 1 + eadj + ebias(prec) 
if aien <, 0 then 

if round = NONE then 

ai <r- a.s || o ebits (P rec > || aifr 

else 

raise FloatingPointArithmetic //Underflow 

endif 

elseif aien ;> lebits(prec) fhm 
if round = NONE then 

//default: round-to-nearest overflow handling 
ai <- a.s || lebits(prec) || o^terec) 

else 

raise FloatingPointArithmetic //Underflow 

endif 

else 

ai <- a.s || aien e bits(prec)-1..0 II aifr 

endif 
SNAN: 

if round * NONE then 

raise FloatingPointArithmetic //Invalid 

endif 

if -a.e < fbits(prec) then 

ai <- a.s || lebits(prec) || a .f. a .e-1..0 II O*" 8 *™ 5 )*" 

Fig. 37 (cont'd) 



else 

Isb <r- a.f. a .e-1-fbits(prec)+1..0 * 0 

ai <- a.s || lebits(prec) „ a.f. a .e-1..-a.e.1.fbits(prec)+2 li isb 

endif 
QNAN: 

if -a.e < fbits(prec) then 

ai «- a.s || lebits(prec) y a .f. a e _ 1 0 1| 0 ft»ts(prec)+a.e 

else 

Isb <- a.f. a .e-1-fbits(prec)+1..0 * 0 

ai <- a.s || lebits(prec) g a.f. a .e-1..-a.e.1.fbits(prec)+2 II Isb 

endif 
ZERO: 

ai *- a.s || o ebits (P rec ) || o fblts (P re c) 
INFINITY: 

ai «- a.s || i©bits(prec) y Qfbits(prec) 

endcase 
defdef 

def ai <- fsinkr(prec, a, round) as 
case a.t of 
NORM: 

msb <r- findmsb(a.f) 
rb <- -a.e 
if rb <, 0 then 

aifr <~ a.f ms b..O II O"* 
aims <r- msb - rb 

else 

case round of 
CCD: 

s <- 0™$ b -rt> || (-ai.s)' 5 
F, F.D: 

s <- 0™b-rb || (ai s) rb 
N, NONE: 

s <- o msb - rb || -ai.ffb || ai.ffc 1 

X: 

if ai.frt>-i ..o * 0 then 

raise FloatingPointArithmetic // Inexact 

endif 

S4-0 

Z, Z.D: 

s<-0 

endcase 

v^(0||a.f ms b..o) + (0||s) 

* v msb = 1 th © n 

aims <- msb + 1 - rb 

else 

aims <- msb - rb 

endif 

aifr <- v a ims..rb 

endif 

if aims > prec then 
case round of 

CD, F.D, NONE, Z.D: 

ai <r- a.s || (-as)P re(>1 

Fig. 37 (cont'd) 



C, F, N, X, Z: 

raise FloatingPointArithmetic // Overflow 

endcase 
elseif a.s = 0 then 
ai <- aifr 

else 

ai <r- -aifr 

endif 
ZERO: 

aj <- 0P rec 
SNAN, QNAN: 

case round of 

CD, F.D, NONE, Z.D: 

a» <- 0P rec 
C, F, N, X, Z: 

raise FloatingPointArithmetic // Invalid 

endcase 
INFINITY: 

case round of 

CD, F.D, NONE, Z.D: 

ai <- a.s || (-as)P rec " 1 
C, F, N,X, Z: 

raise FloatingPointArithmetic // Invalid 

endcase 

endcase 
enddef 

def c <- frecrest(a) as 
b.s<-0 
b.t <- NORM 
b.e<-0 
b.f <-1 

c <- fest(fdiv(b,a)) 
enddef 

def c *- frsqrest(a) as 
b.s «- 0 
b.t <- NORM 
b.e<-0 
b.f<-1 

c <- fest(fsqr(fdiv(b,a))) 
enddef 

def c <- fest(a) as 

if (a.t=NORM) then 

msb <- findmsb(a.f) 
a.e <- a.e + msb - 13 
a.f<-a.f mS b..msb-12ll 1 

else 

c <- a 

endif 
enddef 

def c <- fsqr(a) as 

if (a.t=NORM) and (a.s=0) then 
c.s <- 0 
c.t <- NORM 
if (a.eo = 1)then 

Fig. 37 (cont'd) 



c.e<-(a.e-127)/2 
c.f<-sqr(ai ||0 127 ) 

else 

c.e<-(a.e-128)/2 
c.f<-sqr(a.f ||0 128 ) 

endif 

elseif (a.t=SNAN) or (a.t=QNAN) or a.t=ZERO or ((a.t=INFINITY) and (a.s=0)) then 

C 4 3 

elseif ((a.t=IMORM) or (a.t=INFINITY)) and (a.s=1) then 
c <r- DEFAULTSNAN // Invalid 

else 

assert FALSE // should have covered al the cases above 

endif 
enddef 

Fig. 37 (cont'd) 



E.ADD.F.16 


Ensemble add floating-point half 


E.ADD.F.16.C 


Ensemble add floating-point half ceiling 


E.ADD.F.16.F 


Ensemble add floating-point half floor 


E.ADD.F.16.N 


Ensemble add floating-point half nearest 


E.ADD.F.16.X 


Ensemble add floating-point half exact 


E.ADD.F.16.Z 


Ensemble add floating-point half zero 


E.ADD.F.32 


Ensemble add floating-point single 


E.ADD.F.32.C 


Ensemble add floating-point single ceiling 


E.ADD.F.32.F 


Ensemble add floating-point single floor 


E.ADD.F.32.N 


Ensemble add floating-point single nearest 


E.ADD.F.32.X 


Ensemble add floating-point single exact 


E.ADD.F.32.Z 


Ensemble add floating-point single zero 


E.ADD.F.64 


Ensemble add floating-point double 


E.ADD.F.64.C 


Ensemble add floating-point double ceiling 


E.ADD.F.64.F 


Ensemble add floating-point double floor 


E.ADD.F.64.N 


Ensemble add floating-point double nearest 


E.ADD.F.64.X 


Ensemble add floating-point double exact 


E.ADD.F.64.Z 


Ensemble add floating-point double zero 


E.ADD.F.128 


Ensemble add floating-point quad 


E.ADD.F.128.C 


Ensemble add floating-point quad ceiling 


E.ADD.F.128.F 


Ensemble add floating-point quad floor 


E.ADD.F.128.N 


Ensemble add floating-point quad nearest 


E.ADD.F.128.X 


Ensemble add floating-point quad exact 


E.ADD.F.128.Z 


Ensemble add floating-point quad zero 


E.DIV.F.16 


Ensemble divide floating-point half 


E.DIV.F.16.C 


Ensemble divide floating-point half ceiling 


E.DIV.F.16.F 


Ensemble divide floating-point half floor 


E.DIV.F.16.N 


Ensemble divide floating-point half nearest 


E.DIV.F.16.X 


Ensemble divide floating-point half exact 


E.DIV.F.16.Z 


Ensemble divide floating-point half zero 


E.DIV.F.32 


Ensemble divide floating-point single 


E.DIV.F.32.C 


Ensemble divide floating-point single ceiling 


E.DIV.F.32.F 


Ensemble divide floating-point single floor 


E.DIV.F.32.N 


Ensemble divide floating-point single nearest 


E.DIV.F.32.X 


Ensemble divide floating-point single exact 


E.DIV.F.32.Z 


Ensemble divide floating-point single z^ro 


E.DIV.F.64 


Ensemble divide floating-point double 



Fig. 3° A 



r— r\i\ / r~ o a f> 

E.DIV.F.o4.C 


tnsemDie aiviae Tioaung-point oouDie ceiling 


t.DIV.F.o4.r 


tnsemDie aiviae Tioaiing-point douoie tioor 


fc.UIV.r.o4.l\l 


tnsemDie aiviae Tioating-poini aouDie nearest 


b.UIV.r.o4.A 


tnsemDie aiviae tioaiing-point aouDie exact 


c r\i\/ c ciA 7 
c.UIV.r.b4.*l 


tnsemDie aiviae lioating-point aouDie zero 


b.UIV.r.12o 


tnsemDie aiviae Tioating-point quad 


E.DIV.F.128.C 


tnsemDie aiviae tioating-point quad ceiling 


E.DIV.F.12o.F 


cnsemDie divide floating-point quad floor 


r— r-vi\ / r- 400 Kl 

E.DIV.F.128.N 


Ensemble divide floating-point quad nearest 


E.DIV.F. 128.X 


Ensemble divide floating-point quad exact 


E.DIV.F.128.Z 


Ensemble divide floating-point quad zero 


E.MULC.F.16 


Ensemble multiply complex floating-point half 


E.MULC.F.32 


Ensemble multiply complex floating-point single 


E.MULC.F.64 


Ensemble multiply complex floating-point double 


r k mi ii r~ a & 

E.MULF.16 


Ensemble multiply floating-point half 


r- i ii || i— a ry f\ 

E.MULF.16.C 


Ensemble multiply floating-point half ceiling 


I— iii ii r— a ry ^ 

E.MUL.F.16.F 


Ensemble multiply floating-point half floor 


1 — i ii || r- *i o Kl 

E.MULF.16.N 


Ensemble multiply floating-point half nearest 


^ & ji ii r- a o v/ 

E.MUL.F.16.X 


Ensemble multiply floating-point half exact 


I - ft J | || r- A r> ~7 

E.MUL.F.16.Z 


Ensemble multiply floating-point half zero 


r* r ii ii r— oo 

E.MULF.32 


Ensemble multiply floating-point single 


r— ii| || r— oo 

E.MULF.32.C 


Ensemble multiply floating-point single ceiling 


p— ft l| || I" oo ^ 

E.MULF.32.F 


Ensemble multiply floating-point single floor 


^ ft j i ii r~ oo ft i 

E.MULF.32.N 


Ensemble multiply floating-point single nearest 


r~ ft 1 1 II |""~ OO V/ 

E.MULF.32.X 


Ensemble multiply floating-point single exact 


I - ft A 1 II I - OO "7 

E.MULF.32.Z 


Ensemble multiply floating-point single zero 


r— ft j | || r- o j| 

E.MULF.64 


Ensemble multiply floating-point double 


^ ft 4i ii r~ Oil 

E.MULF.64.C 


Ensemble multiply floating-point double ceiling 


^ ft ai ii r~ Oil ^ 

E.MULF.64.F 


Ensemble multiply floating-point double floor 


^ ft 41 ii n o ii ft i 

E.MUL.F.64.N 


Ensemble multiply floating-point double nearest 


p— ii| || f— Oil v/ 

E.MULF.64.X 


Ensemble multiply floating-point double exact 


r*~ ft 4i ii i~ i 

E.MULF.64.Z 


Ensemble multiply floating-point double zero 


P Ml II P 1 OA 

civiUL.r. izo 


PncamKIa mi ilfiolw flotation nnint oi ■ o r\ 

tnsemDie multiply Tioaiing-pomi quau 


E.MULF.128.C 


Ensemble multiply floating-point quad ceiling 


E.MULF.128.F 


Ensemble multiply floating-point quad floor 


E.MULF.128.N 


Ensemble multiply floating-point quad nearest 


E.MULF.128.X 


Ensemble multiply floating-point quad exact 


E.MULF.128.Z 


Ensemble multiply floating-point quad zero 



Fig. 38A (cont'd) 



Selection 



class 


op 


prec 


round/trap 


add 


EADDF 


16 32 64 128 


NONE C F N X Z 


divide 


EDIVF 


16 32 64 128 


NONE C F N X Z 


multiply 


EMULF 


16 32 64 128 


NONE C F N X Z 


complex multiply 


EMUL.C 
F 


16 32 64 


NONE 



Format 

E.op.prec.round rd=rc,rb 
rd=eopprecround(rc,rb) 

31 24 23 18 17 12 11 65 0 

f~ E.prec | rd | re | rb | op.round \ 

8 6 6 6 6 



Fig. 38B 



Definition 

defmul(siz .vj.wjjas 

mu! <- fmul(F(si2e,Vsize-1+i. j).f r (size,w S ize-1+j..j)) 
enddef 

def EnsembleFloatingPoinUop^rec.round.ra.rb/c) as 
c <- RegRead(rc, 128) 
b <- RegRead(rb, 128) 
for i <r- 0 to 128-prec by prec 
ci<-F(prec,Ci +P rec-1..i) 
bi<-F(prec,bj +pr ec-l..i) 
case op of 
E.ADD.F: 

ai <- faddr(ci,bi f round) 
E.MUL.F: 

ai fmul(ci f bi) 
E.MUL.C.F: 

if (i and prec) then 

ai <- fadd(mul(prec,c,i,b f i-prec), muKprec.ci-precbJ)) 

else 

ai <- fsub(mul(prec,c,l,b,l) f mul(prec,c,i+prec,b f i+prec)) 

end if 
E.DIV.F.: 

ai <- fdiv(ci.bi) 

endcase 

a i+prec-1..i <- PackF(prec, ai, round) 
endfor 

RegWrite(rd, 128, a) 
enddef 



Exceptions 

Floating-point arithmetic 



Fig. 38C 



Operation codes 



F MUL ADD CF 1fi 


Ensemble multiDlv add comnlex floatina-Doint half 


E MUL ADD C F 32 


Ensemble multiDlv add comDlex floatina-Doint sinale 


F MUL ADD C F 64 


Ensemble multiDlv add comDlex floatina-Doint double 


E MUL ADD F 16 


Ensemble multiDlv add fioatina-Doint half 


E MUL ADD F 16 C 


Ensemble multiDlv add floatina-Doint half rpilinn 

L>l IwvMIUIw IIIVJIUL^IY UUvJ llvCIUI IU WWII 11 1 lull VsClllliy 


E MUL ADD F 16 F 


Ensemble multiDlv add floatina-noint half floor 


F Ml Jl ADD F 16 M 

CIViUL./AL/L'.l . IU.IN 


Fnsemblp miiltinlv/ add floati nn-nnint half noaroct 

i — i iovi 1 1 uic iiiuiiipiy auu iiwauiiy l/uiiii iidii iicdicol 


p Ml Jl ADD F 16 X 


Pn^pmhlp multinlv aHH flnati nn-nnint half ovort 
l_i iwvi i iuic iiivJiUL/iy auu iiuaui ly uuii u iidil CAdUl 


f mi ii Ann p ift 7 


PnQPmhlp multinlv/ aHH flnatinn.nnint half 70m 
l_i loci i iuic iiiuiuuiy dUU livjdlll ly-pun ii Hall Z.ciU 


F Ml II Ann F 10 


PnQPmhlp multinlv/ aHH flnati nn-nnint cinnlo 
t.i ioci i iuic iiiuuipiy auu iiuduny-puiiii oillylc 


P mi ii Ann p^9p 


Pncomhlp miiltinlv/ aHH flnatinn.nnint c inn lo r-c*\\tnr% 

c_i ioci i iuic multiply auu iiuauiiy-puim oinyic Celling 


F Ml II Ann F ?9 F 


PnoomhJp multinlv/ aHH flnptinn.nnint cinnlo flnrtr 
l.1 ioci 1 1 Kfivs iiiuiujjiy auu iil/ciiii ly uuii u oiiiyit? nuui 


F Ml Jl Ann P 79 M 


Pn^pmhlp multinlv/ flHH flnati nn-nnint cinnlo noaroct 
L-i locniutc niuiuuiy auu iiuani lyuuiiu olliyio iicaltJol 


f mi ii Ann F 79 X 

L_.IVIvJl_./AL/L/.l . OZ. ./\ 


Pn^pmhlp multinlv/ add flnptinn-nnint cinnlo ovart 
^.i ioci i luic? iiiuiuuiy auu iivjaiiny uuii u oil lyit? (;AaUl 


p mi ii Ann P 79 7 

CZ.IVIUI nUU.r.OZ.L 


Fncomhlo miiltinlv/ oHH flnotinn_nnint cinnlo 7am ' 

i_i looii iuic inuiupiy duu iiudiii ly-puiiu 0111916 zero 


f mi ii Ann F RA 


Pncpmhlp multinlv/ aHH flnati nn-nnint HniiKlo 
i—iiodiiijic iiiuiiipiy duu iiuaiii ly-puii u uuuuic 


F Ml Jl Ann F 64 C 


Pncpmhlp multinlv/ aHH flnatinn-nnint Hnnhlo noilinn 


F Ml II Ann F 64 F 
C IVI KJ u .r\U U . i .D*t . i 


PnQPmhlp multinlv/ aHH flnati nn-nnint Hniihlo flnnr 
a loci 1 iuic iiiuiii|jiy auu nuain ly-pun 11 uuuuic nuur 


P Ml II Ann P f\A M 
C .IVIUL.MLIU.r.D*f .IN 


Pncomhlo mi iltinK/ aHH flnoti nn nnint Hm iKIa naoract 
[-llociilUlc iTIullipiy auu IIUdUMy-pUini UOUDI6 11601601 


p mi ii Ann f ftii y 

C.IVlUL.MUU.r.D^.A 


F-ncorrthlo mi iltinl\# orlH flnof inn rv%Snt rAr\t iKIa avopf 

l_iiociiiuiu rnuiupiy auu iiuauny-poini aouDie exaci 


F Ml II Ann PR4 7 


PnQPmKlo multinlv/ oHH flnatinn.nnint Hnnhla 70m 

c_i loci 1 iuic iiiuiupiy duu iiuaiif ly-poini ciouuie zero ,» 


F Ml II Ann F 19fl 

CIVIUL./AUL/.r . IZO 


FnQPmhlo miiltinlv/ aHH flnatinn.nnint miaH 
U.110C111UIC iiiuiupiy duu iiudiu ly -jjuii 11 ijUdu 


F Ml II Ann F 19ft P 


PncPmHio miiltinlv/ aHH flnatinn.nnint nnoH noilinn 

L-i loci uuic iiiuiupiy auu iioauriy*poini ijUaU Gciiiny 


F Ml Jl Ann F 19ft F 


PnQPmhlp miiltinlv/ aHH flnatinn.nnint nnaH f\r\r\r 
L_iiociiiUic iiiuiuuiy auu IIUalliiy~poini l^UaU iioor 


F Ml II Ann F 19ft M 


Pncpmhlp miiltinlv/ aHH flnatinn.nnint nnaH no a roc t 

L.110C111UIC iiiuiuuiy duu iiudiu iy~uuini tfuau ncdicoi 


F Mill Ann F 19ft X 

t- . IVI UL.nUL/.r . I ZO./\ 


Pncpmhlp multinlv/ aHH flnatinn.nnint nnaH ovant 
l.i ioci 1 il/ic iiiuiuuiy auu nuaui lyuuuii LjUdU cAdOL 


F Ml Jl Ann F 19ft 7 


Fn<?pmhlp multinlv/ add flnati nn-nnint nnaH 70m 
i_i iochiuic iiiuiuuiy auu iiuauiiu uumi uudu zciu 


E.MULSUB.C.F.16 


Ensemble multiply subtract complex floating-point half 


E.MULSUB.C.F.32 


Ensemble multiply subtract complex floating-point single 


E.MUL.SUB.C.F.64 


Ensemble multiply subtract complex floating-point double 


E.MULSUB.F.16 


Ensemble multiply subtract floating-point half 


E.MULSUB.F.32 


Ensemble multiply subtract floating-point single 


E.MULSUB.F.64 


Ensemble multiply subtract floating-point double j 


E.MULSUB.F.128 


Ensemble multiply subtract floating-point quad 



Fi?. 38D 



S I ction 



class 


op 


type 


prec 


round/trap 


multiply add 


E.MULAD 
D 


F 


16 32 64 128 


noneCFNXZ 






C.F 


16 32 64 


NONE 


multiply subtract 


E.MUL.SU 
B 


F 


16 32 64 128 


NONE 






C.F 


16 32 64 


NONE 



Format 



E.op.size rd@rc,rb 
rd=eopsize(rd,rc,rb) 

31 24 23 18 17 12 11 65 0 

I E.size I rd | rc | rb | op 

8 6 6 6 6 



Fig. 38E 



1 



Definition 

def muKsize.vj.wj) as 

mul <r- fmul(F(size l v S i ze -i+i..i),F(size l w s i ze -i+j.j)) 
enddef 

def EnsemblelnplaceFloatingPoint(op,size,rd,rc,rb) as 
d 4- RegRead(rd t 128) 
c <- RegRead(rc, 128) 
b <- RegRead(rb, 128) 
for i ^- 0 to 128-size by size 
di<-F(prec,di +pr ec.1..i) 
case op of 

E.MULADD.F: 

ai <- fadd(di, mul(prec,c,i,b,i)) 
E.MULADD.C.F: 

if (i and prec) then 

ai <- fadd(di f fadd(mul(prec,c ( i,b,i-prec), mul(c,i-prec,b,i))) 

else 

ai <- fadd(di t fsubCmuKprec.ci.b.i), mul(prec,c,i+prec,b,i+prec))) 

end if 
E.MULSUB.F: 

ai <- frsub(di, mul(prec,c,i,b,i)) 
E.MUL.SUB.C.F: 

if (i and prec) then 

ai <- frsub(di t fadd(mul(prec f c,i,b,i-prec), muKci-prec.bj))) 

else 

ai <- frsub(di, fsub(mul(prec,c,i,b,i), mul(prec,c,i+prec,b,i+prec))) 

endif 

endcase 

ai+prec-1..i *- PackF(prec, ai, round) 
endfor 

RegWrite(rd, 128, a) 
enddef 

Exceptions 

none 

Fig. 38F 



Operati n codes 



E.SCALADD.F.16 


Ensemble scale add floating-point half 


E.SCAL.ADD.F.32 


Ensemble scale add floating-point single 


E.SCAL.ADD.F.64 


Ensemble scale add floating-point double 



Fig. 38G 



Selecti n 



class 


op 


prec 


scale add 


E.SCAL.ADD.F 


16 32 64 



Format 



E.SCALADD.F.size ra=rd,rc,rb 
ra=escaladdfsize(rd,rc,rb) 

31 24 23 18 17 12 11 65 0 

I op I rd | rc | rb | ra 

8 6 6 6 6 



Fig. 38H 



Definition 

def EnsembleFloatingPointTemary(op l prec,rd l rc,rb.ra) as 
d <- RegRead(rd, 128) 
c <- RegRead(rc, 128) 
b <- RegRead(rb, 128) 
for I <- 0 to 128-prec by prec 

di<-F(prec,di +pre c.i.j) 

ci<-F(prec.C} + p reo .ij) 

ai <- fadd(fmul(di, F(prec,b pre c.i..o)). frnul(cl, F(prec.b2* pre c-1..prec))) 
8|+prec-1 J «- PackF(prec, ai, none) 
endfor 

RegWrite(ra, 128. a) 
nddef 

Exceptions 

none 

Fig. 381 



C 0 1 IQ C 

b.oUB.r.lb 


tnsemDie suDtract tioating-point nait 


b.SUB.r.lb.U 


Ensemble subtract floating-point half ceiling 


C O 1 ID C A a c 

b.oUB.r.lb.r 


Ensemble subtract floating-point half floor 


C Ol ID C M 

b.oUD.r.lo.N 


bnsemDie suDtract floating-point nan nearest 


C CI ID C 7 

b.oUB.KIo.Z 


bnsembie subtract floating-point half zero 


C Ol ID C -iC V 

E.SUB.r.lO.X 


Ensemble subtract floating-point half exact 


C Ol ID CT OO 

b.SUB.F.32 


Ensemble subtract floating-point single 


r— oi in r— /> 

E.SUB.F.32.C 


Ensemble subtract floating-point single ceiling 


E.SUB.F.32.F 


Ensemble subtract floating-point single floor 


|— o 1 1 d r— oo K 1 

E.SUB.F.32.N 


Ensemble subtract floating-point single nearest 


j— oi in r~~ oo ~7 

E.SUB.F.32.Z 


Ensemble subtract floating-point single zero 


r— o i in r~ oo v/ 

E.SUB.F.32.X 


Ensemble subtract floating-point single exact 


E.SUB.F.64 


Ensemble subtract floating-point double 


r— • oi ID r~ O yl ^> 

E.SUB.F.64.C 


Ensemble subtract floating-point double ceiling 


r— oi ID I"~ £> y| f— 

E.SUB.F.64.F 


Ensemble subtract floating-point double floor 


r - • oi id r~ ^vl K 1 

E.SUB.F.64. N 


Ensemble subtract floating-point double nearest 


C Ol ID C ^ A ~7 

E.SUB.F.64.Z 


Ensemble subtract floating-point double zero 


F SUB F fi4 X 


l_ 1 IOCII IL/IC7 9UUU uLl IIVJOUI \KJ yJUli 11 UVJUUIC7 UACiul 


E.SUB.F.128 


Ensemble subtract floating-point quad 


E.SUB.F.128.C 


Ensemble subtract floating-point quad ceiling 


E.SUB.F.128.F 


Ensemble subtract floating-point quad floor 


E.SUB.F.128.N 


Ensemble subtract floating-point quad nearest 


E.SUB.F.128.Z 


Ensemble subtract floating-point quad zero 


E.SUB.F.128.X 


Ensemble subtract floating-point quad exact 



Fig. 39A 



Selection 



class 


op 


prec 


round/trap 


set 


SET. 
E LG 
L GE 


16 32 64 128 


NONE X 


subtract 


SUB 


16 32 64 128 


NONE C F N X Z 



Format 

E.op.prec.round rd=rb,rc 
rd=eopprecround(rb,rc) 

31 24 23 18 17 12 11 65 0 

| E.prec | rd | rc | rb | op.round | 

8 6 6 6 6 



Fig. 39B 



Definition 

def EnsembleReversedFloatingPoint(op,prec,round,rd,rc,rb) as 
c <- RegRead(rc, 128) 
b<- RegRead(rb, 128) 
for i <- 0 to 128-prec by prec 

ci^F(prec,Cj + p r ec-l..i) 

bi<-F(prec l bj + p re c-l..i) 

ai <- frsubr(ci,-bi, round) 

ai+prec-1..i <- PackF(prec, ai, round) 
endfor 

RegWrite(rd, 128, a) 
enddef 



Exceptions 

Floating-point arithmetic 



Fig. 39C 



Operation codes 



G.SET.E.F.16 


Group set equal floating-point half \ 


G.SET.E.F.16.X 


Group set equal floating-point half exact 


G.SET.E.F.32 


Group set equal floating-point single 


G.SET.E.F.32.X 


Group set equal floating-point single exact 


G.SET.E.F.64 


Group set equal floating-point double 


G.SET.E.F.64.X 


Group set equal floating-point double exact 


G.SET.E.F.128 


Group set equal floating-point quad 


G.SET.E.F.128.X 


Group set equal floating-point quad exact 


G.SET.GE.F.16.X 


Group set greater equal floating-point half exact 


G.SET.GE.F.32.X 


Group set greater equal floating-point single exact 


G.SET.GE.F.64.X 


Group set greater equal floating-point double exact 


G.SET.GE.F.128.X 


Group set greater equal floating-point quad exact 


G.SET.LG.F.16 


Group set less greater floating-point half 


G.SET.LG.F.16.X 


Group set less greater floating-point half exact j 


G.SET.LG.F.32 


Group set less greater floating-point single 


G.SET.LG.F.32.X 


Group set less greater floating-point single exact 


G.SET.LG.F.64 


Group set less greater floating-point double 


G.SET.LG.F.64.X 


Group set less greater floating-point double exact 


G.SET.LG.F.128 


Group set less greater floating-point quad 


G.SET.LG.F.128.X 


Group set less greater floating-point quad exact 


G.SET.L.F.16 


Group set less floating-point half 


G.SET.L.F.16.X 


Group set less floating-point half exact 


G.SET.L.F.32 


Group set less floating-point single 


G.SET.L.F.32.X 


Group set less floating-point single exact 


G.SET.L.F.64 


Group set less floating-point double 


G.SET.L.F.64.X 


Group set less floating-point double exact 


G.SET.L.F.128 


Group set less floating-point quad 


G.SET.L.F.128.X 


Group set less floating-point quad exact 


G.SET.GE.F.16 


Group set greater equal floating-point half 


G.SET.GE.F.32 


Group set greater equal floating-point single 


G.SET.GE.F.64 


Group set greater equal floating-point double 


G.SET.GE.F.128 


Group set greater equal floating-point quad 



Fig. 39D 



Equivalencies 



OCX I C C 4 G V 

G.ocT.Lb.r.ib.X 


CXrrw ir\ cot locc ani i ol flr\Qtinn_nnir\t Hotf ovart 
UFUUp ocl Icoo cijUal HUdUliy-puilll flail cXdUl 


/"* OCX ICC OO V 


firm in cot locc oniial flnstinn.onint cinnlo ovart 
vjiUUp oci icoo CLjUai i lUoui ly* pull 1 1 oiiiyic CAaui 


OCT ICC a. A V 

u.ot / .Lfc.r.04.A 


C^rrw m cot locc omial flosttnn.noint HonKlo oyart 
uiuup oci icoo ciJUdi iiuaui iy pun 11 UUULHC cAaul 


OCX ICC -too V 


CXmi ir\ cot locc onital flnsitinn-nriint ni iqH ovaM 
OIUUp oCI IBoo CljUdl IHJaul ly-puil 11 LjUdU cAdUl 


OCX /"* C 4/? 

G.ScT.G.r.lo 


firrM ir\ cot nroator fl^atinn-nrwnt Kolf 

oiuup oci yicaitJi uudiiny-fjuii u iidii 


/-\ OCX EZ 4 G \/ 

G.ScT.G.r.lb.X 


Prni i r\ cot nrootor flnotinn_r%r^trit K o If ovoM 

oroup Sci yrtJdier iiOdung-poini nan exact 


G.SET.G.F.32 


oroup sei greater noaung-poini single 


G.SE/.G.F.32.X 


oroup sei greater Floating-point single exact 


G. SET. G.F. 64 


oroup set greater Tioating-point aouDie 


VJ. OC 1 .Kj.r. OH. A. 


GrouD set areater floatina-Doint double exart 


G.SET.G.F.128 


Group set greater floating-point quad 


G.SET.G.F.128.X 


Group set greater floating-point quad exact 


G.SET.LE.F.16 


Group set less equal floating-point half 


G.SET.LE.F.32 


Group set less equal floating-point single 


G.SET.LE.F.64 


Group set less equal floating-point double 


G.SET.LE.F.128 


Group set less equal floating-point quad 



G.SET.G.F.prec rd=rb,rc 


-» 


G.SET.LF.prec rd=rc,rb 


G.SET.G.F.prec.X rd=rb,rc 


-> 


G.SET.LF.prec.X rd=rc,rb 


G.SET.LE.F.prec rd=rb,rc 


-» 


G.SET.GE.F.prec rd=rc,rb 


G.SET.LE.F.prec.X rd=rb,rc 


-> 


G.SET.GE.F.prec.X rd=rc,rb 



Fig. 39E 



Selection 



class 


op 


prec 


round/trap 


set 


SET. 

E LG 
L GE 
G LE 


16 32 64 128 


NONE X 



Format 



G.op.prec.round rd=rb,rc 
rc=gopprecround(rb,ra) 

31 24 23 18 17 12 11 65 0 

I G.prec | rd | rc | rb | op.round | 

8 6 6 6 6 



Fig 39F 



Definition 



def GroupFloatingPointReversedtop.prec.round.rd.rc.rb) as 
c <- RegRead(rc ? 128) 
b <- RegRead(rb, 128) 
for i 4- 0 to 128-prec by prec 
ci^F(prec,Cj +pr ec-1..i) 
bi <- F(prec,bj+p re c-i.j) 
if round^NONE then 

if (di.t = SNAN) or (ci.t = SNAN) then 
raise FloatingPointArithmetic 

endif 

case op of 

G.SET.L.F, G.SET.GE.F: 

if (di.t = QNAN) or (ci.t = QNAN) then 
raise FloatingPointArithmetic 

endif 
others: //nothing 
endcase 

endif 

case op of 

G.SET.L.F: 

ai <- bi?>ci 
G.SET.GE.F: 

ai <- bi!?<ci 
G.SET.E.F: 
ai bi=ci 
. G.SET.LG.F: 
ai <- bi*ci 

endcase 

ai+prec-1..i<-aiP rec 
endfor 

RegWrite(rd, 128, a) 
enddef 

Exceptions 

Floating-point arithmetic 

Fig. 39G 



G.C0M.E.F.16 


Group compare equal floating-point half 


G.C0M.E.F.16.X 


Group compare equal floating-point half exact 


G.COM.E.F.32 


Group compare equal floating-point single 


G.COM.E.F.32.X 


Group compare equal floating-point single exact 


G.COM.E.F.64 


Group compare equal floating-point double 


G.COM.E.F.64.X 


Group compare equal floating-point double exact 


G.COM.E.F.128 


Group compare equal floating-point quad 


G.COM.E.F.128.X 


Group compare equal floating-point quad exact 


G.C0M.GE.F.16 


Group compare greater or equal floating-point half 


G.C0M.GE.F.16.X 


Group compare greater or equal floating-point half exact 


G.COM.GE.F.32 


Group compare greater or equal floating-point single 


G.COM.GE.F.32.X 


Group compare greater or equal floating-point single exact 


G.COM.GE.F.64 


Group compare greater or equal floating-point double ! 


G.COM.GE.F.64.X 


Group compare greater or equal floating-point double exact ; 


G.COM.GE.F.128 


Group compare greater or equal floating-point quad 


G.COM.GE.F.128.X 


Group compare greater or equal floating-point quad exact 


G.C0M.LF.16 


Group compare less floating-point half 


G.C0M.L.F.16.X 


Group compare less floating-point half exact 


G.COM.L.F.32 


Group compare less floating-point single 


G.COM.L.F.32.X 


Group compare less floating-point single exact 


G.COM.L.F.64 


Group compare less floating-point double j 


G.COM.LF.64.X 


Group compare less floating-point double exact 


G.COM.LF.128 


Group compare less floating-point quad 


G.COM.L.F.128.X 


Group compare less floating-point quad exact 


G.C0M.LG.F.16 


Group compare less or greater floating-point half 


G.C0M.LG.F.16.X 


Group compare less or greater floating-point half exact 


G.COM.LG.F.32 


Group compare less or greater floating-point single 


G.COM.LG.F.32.X 


Group compare less or greater floating-point single exact 


G.COM.LG.F.64 


Group compare less or greater floating-point double 


G.COM.LG.F.64.X 


Group compare less or greater floating-point double exact 


G.COM.LG.F.128 


Group compare less or greater floating-point quad 


G.COM.LG.F.128.X 


Group compare less or greater floating-point quad exact 



Fig. 40A 



Format 



G.COM.op.prec.round rd.rc 
rc=gcomGpprecround(rd,rc) 

31 24 23 18 17 12 11 6 5 0 

| G.prec | rd | rc | op | GCOM j 

8 6 6 6 6 



Fig. 40B 



Definition 

def GroupCompareFloatingPointfop.prec.round.rd.rc) as 
d <r- RegRead(rd, 128) 
c <- RegRead(rc, 128) 
for i «- 0 to 128-prec by prec 
di<-F(prec,dj +P rec-1..i) 
ci<-F(prec,Cj +P rec-1.j) 
if round*NONE then 

if (di.t = SNAN) or (ci.t = SNAN) then 
raise FloatingPointArithmetic 

endif 

case op of 

G.COM.LF, G.COM.GE.F: 

if (di.t = QNAN) or (ci.t = QNAN) then 
raise FloatingPointArithmetic 

endif 
others: //nothing 
endcase 

endif 

case op of 

G.COM.LF: 

ai <- di?>ci 
G.COM.GE.F: 

ai <r- di!?<ci 
G.COM.E.F: 

ai <- di=ci 
G.COM.LG.F: 

ai <r- di^ci 

endcase 

ai+prec-1..i^-a> 
endfor 

if (a * 0) then 

raise FloatingPointArithmetic 

endif 
enddef 



Exceptions 

Floating-point arithmetic 



Fig. 40C 



E ABS F 16 


Ensemble absolute value floating-point half 


E ABS F 16 X 


Ensemble absolute value floating-point half exception 


E ABS.F.32 


Ensemble absolute value floating-point single 


E.ABS.F.32 X 


Ensemble absolute value floating-point single exception 


E ABS F 64 


Ensemble absolute value floating-point double 


E ABS.F.64 X 


Ensemble absolute value floating-point double exception 


E ABS F 128 


Ensemble absolute value floating-point quad 


E ABS F 1 28 X 


Ensemble absolute value floating-point quad exception 


E COPY F 16 


Ensemble copy floating-point half 


E COPY F 16 X 

fcaaa • ^a^ ^aar 1 1*1 • 1 w ».r > 


Ensemble copy floating-point half exception 


E COPY F 32 


Ensemble copy floating-point single 


E COPY F 32 X 


Ensemble copy floating-point single exception I 


E COPY F 64 


Ensemble copy floating-point double 


E.COPY.F.64.X 


Ensemble copy floating-point double exception 


E COPY F 128 

•Waa a Va# 1 I • 1 • 1 bV 


Ensemble copy floating-point quad 


E COPY F 128 X 


Ensemble copy floating-point quad exception 


E DEFLATE F 32 


Ensemble convert floating-point half from single 


E DEFLATE F 32 C 


Ensemble convert floating-point half from single ceiling 


E DEFLATE F 32 F 

• i ■ aaa*» a_ 1 1 f 1 1 hap • I • ■ 1 


Ensemble convert floating-point half from single floor 


E DEFLATE F 32 N 


Ensemble convert floating-point half from single nearest 


E DEFLATE F 32 X 


Ensemble convert floating-point half from single exact 


E DEFLATE F 32 Z 


Ensemble convert floating-point half from single zero 


E DEFLATE F 64 


Ensemble convert floating-point single from double 


E DEFLATE F 64 C 

a^» a •»■•* »aaa 1 1 r 1 1 L« • 1 ■ \*/ T • ^a^r 


Ensemble convert floating-point single from double ceiling 


E DEFLATE F 64 F 


Ensemble convert floating-point single from double floor | 


E DEFLATE F 64 N 

lav • La** l_ 1 ha># % 1 L_ a 1 •V^Ttl^l 


Ensemble convert floating-point single from double nearest 


E DEFLATE F 64 X 


Ensemble convert floating-point single from double exact 


E DEFLATE F 64 Z 


Ensemble convert floating-point single from double zero 


E DEFLATE F 128 


Ensemble convert floating-point double from quad 


E DEFLATE F 128 C 


Ensemble convert floating-point double from quad ceiling 


E DEFLATE F 128 F 


Ensemble convert floating-point double from quad floor 


E DEFLATE F 128 N 


Ensemble convert floating-point double from quad nearest 


E. DEFLATE F 128X 

•a» • la/ L« 1 IvaT * 1 Uil • 1 aWV a/X 


Ensemble convert floating-point double from quad exact 


E. DEFLATE F 128 Z 


Ensemble convert floating-point double from quad zero 


E.FL0AT.F.16 


Ensemble convert floating-point half from doublets 


E.FL0AT.F.16.C 


Ensemble convert floating-point half from doublets ceiling 


E.FL0AT.F.16.F 


Ensemble convert floating-point half frcn doublets floor 


E.FL0AT.F.16.N 


Ensemble convert floating-point half from doublets nearest 


E.FLOAT.F.16.X 


Ensemble convert floating-point half from doublets exact 


E.FL0AT.F.16.Z 


Ensemble convert floating-point half from doublets zero j 



Fig.41A 



E.FLOAT.F.32 


Ensemble convert floating-point single from quadlets 


E.FLOAT.F.32.C 


Ensemble convert floating-point single from quadlets ceiling 


E.FLOAT.F.32.F 


Ensemble convert floating-point single from quadlets floor 


E.FLOAT.F.32.N 


Ensemble convert floating-point singl from quadlets nearest 


E.FLOAT.F.32.X 


Ensemble convert floating-point single from quadlets exact 


E.FLOAT.F.32.Z 


Ensemble convert floating-point single from quadlets zero 


E.FLOAT.F.64 


Ensemble convert floating-point double from octlets 


E.FLOAT.F.64.C 


Ensemble convert floating-point double from octlets ceiling 


E.FLOAT.F.64.F 


Ensemble convert floating-point double from octlets floor 


E.FLOAT.F.64.N 


Ensemble convert floating-point double from octlets nearest 


E.FLOAT.F.64.X 


Ensemble convert floating-point double from octlets exact 


E.FLOAT.F.64.Z 


Ensemble convert floating-point double from octlets zero 


E.FLOAT.F.128 


Ensemble convert floating-point quad from hexlet 


E.FLOAT.F.128.C 


Ensemble convert floating-point quad from hexlet ceiling 


E.FLOAT.F.128.F 


Ensemble convert floating-point quad from hexlet floor 


E.FLOAT.F.128.N 


Ensemble convert floating-point quad from hexlet nearest 


E.FLOAT.F.128.X 


Ensemble convert floating-point quad from hexlet exact 


E.FLOAT.F.128.Z 


Ensemble convert floating-point quad from hexlet zero 


E.INFLATE.F.16 


Ensemble convert floating-point single from half 


E.INFLATE.F.16.X 


Ensemble convert floating-point single from half exception 


E. INFLATE. F.32 


Ensemble convert floating-point double from single 


E.INFLATE.F.32.X 


Ensemble convert floating-point double from single exception 


E.INFLATE.F.64 


Ensemble convert floating-point quad from double 


E.INFLATE.F.64.X 


Ensemble convert floating-point quad from double exception 


E.NEG.F.16 


Ensemble negate floating-point half 


E.NEG.F.16.X 


Ensemble negate floating-point half exception 


E.NEG.F.32 


Ensemble negate floating-point single 


E.NEG.F.32.X 


Ensemble negate floating-point single exception 


E.NEG.F.64 


Ensemble negate floating-point double 


E.NEG.F.64.X 


Ensemble negate floating-point double exception 


E.NEG.F.128 


Ensemble negate floating-point quad 


E.NEG.F.128.X 


Ensemble negate floating-point quad exception 


E.RECEST.F.16 


Ensemble reciprocal estimate floating-point half 


E.RECEST.F.16.X 


Ensemble reciprocal estimate floating-point half exception 


E.RECEST.F.32 


Ensemble reciprocal estimate floating-point single | 


b.KbUbo 1 .r.oz.A 


cnsemuie reciprocal estimate floating-point single exception 


E.RECEST.F.64 


Ensemble reciprocal estimate floating-point double 


E.RECEST.F.64.X 


Ensemble reciprocal estimate floating-point double exception 


E.RECEST.F.128 


Ensemble reciprocal estimate floating-point quad 


E.RECEST.F. 128.X 


Ensemble reciprocal estimate floating-point quad exception 



Fig. 41A (cont'd) 



E.RSQREST.F.16 


Ensemble floating-point reciprocal squar root estimate half 


E.RSQREST.F.16.X 


Ensemble floating-point r ciprocal square root estimate half exact 


E.RSQREST.F.32 


Ensemble floating-point reciprocal squar root estimate single 


E.RSQREST.F.32.X 


Ensemble floating-point reciprocal square root estimate single exact 


E.RSQREST.F.64 


Ensemble floating-point reciprocal square root estimate double 


E.RSQREST.F.64.X 


Ensemble floating-point reciprocal square root estimate double exact 


E.RSQREST.F.128 


Ensemble floating-point reciprocal square root estimate quad 


E.RSQREST.F. 128.X 


Ensemble floating-point reciprocal square root estimate quad exact 


E.SINK.F.16 


Ensemble convert floating-point doublets from half nearest default 


E.SINK.F.16.C 


Ensemble convert floating-point doublets from half ceiling 


E.SINK.F.16.C.D 


Ensemble convert floating-point doublets from half ceiling default 


E.SINK.F.16.F 


Ensemble convert floating-point doublets from half floor j 


E.SINK.F.16.F.D 


Ensemble convert floating-point doublets from half floor default 


E.SINK.F.16.N 


Ensemble convert floating-point doublets from half nearest 


E.SINK.F.16.X 


Ensemble convert floating-point doublets from half exact 


E.SINK.F.16.Z 


Ensemble convert floating-point doublets from half zero 


E.SINK.F.16.Z.D 


Ensemble convert floating-point doublets from half zero default 


E.SINK.F.32 


Ensemble convert floating-point quadlets from single nearest default 


E.SINK.F.32.C 


Ensemble convert floating-point quadlets from single ceiling 


E.SINK.F.32.C.D 


Ensemble convert floating-point quadlets from single ceiling default 


E.SINK.F.32.F 


Ensemble convert floating-point quadlets from single floor 


E.SINK.F.32.F.D 


Ensemble convert floating-point quadlets from single floor default 


E.SINK.F.32.N 


Ensemble convert floating-point quadlets from single nearest 


E.SINK.F.32.X 


Ensemble convert floating-point quadlets from single exact 


E.SINK.F.32.Z 


Ensemble convert floating-point quadlets from single zero 


E.SINK.F.32.Z.D 


Ensemble convert floating-point quadlets from single zero default 


E.SINK.F.64 


Ensemble convert floating-point octlets from double nearest default 


E.SINK.F.64.C 


Ensemble convert floating-point octlets from double ceiling 


E.SINK.F.64.C.D 


Ensemble convert floating-point octlets from double ceiling default 


E.SINK.F.64.F 


Ensemble convert floating-point octlets from double floor j 


E.SINK.F.64.F.D 


Ensemble convert floating-point octlets from double floor default 


E.SINK.F.64.N 


Ensemble convert floating-point octlets from double nearest 


E.SINK.F.64.X 


Ensemble convert floating-point octlets from double exact j 


E.SINK.F.64.Z 


Ensemble convert floating-point octlets from double zero 


E.SINK.F.64 .Z.D 


Ensemble convert floating-point octlets from double zero default 


E.SINK.F.128 


Ensemble convert floating-point hexlet from quad nearest default 


E.SINK.F.128.C 


Ensemble convert floating-point hexlet from quad celling 


E.SINK.F.128.C.D 


Ensemble convert floating-point hexlet from quad ceiling default 


E.SINK.F.128.F 


Ensemble convert floating-point hexlet from quad floor 


E.SINK.F.128.F.D 


Ensemble convert floating-point hexlet from quad floor default 
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E.SINK.F.128.N 


Ensemble convert floating-point hexlet from quad nearest 


E.SINK.F.128.X 


Ensemble convert floating-point hexlet from quad exact 


E.SINK.F.128.Z 


Ensemble convert floating-point hexlet from quad zero 


E.SINK.F.128.Z.D 


Ensemble convert floating-point hexlet from quad zero default 


E.SQR.F.16 


Ensemble square root floating-point half 


E.SQR.F.16. C 


Ensemble square root floating-point half ceiling 


E.SQR.F.16.F 


Ensemble square root floating-point half floor 


E.SQR.F.16.N 


Ensemble square root floating-point half nearest 


E.SQR.F.16.X 


Ensemble square root floating-point half exact 


E.SQR.F.16.Z 


Ensemble square root floating-point half zero 


E.SQR.F.32 


Ensemble square root floating-point single 


E.SQR.F.32.C 


Ensemble square root floating-point single ceiling 


E.SQR.F.32.F 


Ensemble square root floating-point single floor 


E.SQR.F.32.N 


Ensemble square root floating-point single nearest 


E.SQR.F.32.X 


Ensemble square root floating-point single exact 


E.SQR.F.32.Z 


Ensemble square root floating-point single zero 


E.SQR.F.64 


Ensemble square root floating-point double 


E.SQR.F.64.C 


Ensemble square root floating-point double ceiling 


E.SQR.F.64.F 


Ensemble square root floating-point double floor 


E.SQR.F.64.N 


Ensemble square root floating-point double nearest j 


E.SQR.F.64.X 


Ensemble square root floating-point double exact 


E.SQR.F.64.Z 


Ensemble square root floating-point double zero 


E.SQR.F.128 


Ensemble square root floating-point quad 


E.SQR.F.128.C 


Ensemble square root floating-point quad ceiling 


E.SQR.F.128.F 


Ensemble square root floating-point quad floor 


E.SQR.F.128.N 


Ensemble square root floating-point quad nearest 


E.SQR.F.128.X 


Ensemble square root floating-point quad exact 


E.SQR.F.128.Z 


Ensemble square root floating-point quad zero 


E.SUM.F.16 


Ensemble sum floating-point half 


E.SUM.F.16.C 


Ensemble sum floating-point half ceiling 


E.SUM.F.16.F 


Ensemble sum floating-point half floor 


E.SUM.F.16.N 


Ensemble sum floating-point half nearest 


E.SUM.F.16.X 


Ensemble sum floating-point half exact 


E.SUM.F.16.Z 


Ensemble sum floating-point half zero 


E.SUM.F.32 


Ensemble sum floating-point single 


t.oUIVI. r.o^.U 


^iiacmuitj ouiii nuduny-poini single ceiling 


E.SUM.F.32.F 


Ensemble sum floating-point single floor 


E.SUM.r32.N 


Ensemble sum floating-point single nearest 


E.SUM.F.32.X 


Ensemble sum floating-point single exact 


E.SUM.F.32.Z 


Ensemble sum floating-point single zero 
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E.SUM.F.64 


Ensemble sum floating-point double 


E.SUM.F.64.C 


Ensemble sum floating-point double ceiling 


E.SUM.F.64.F 


Ensemble sum floating-point double floor 


E.SUM.F.64.N 


Ensemble sum floating-point double nearest 


E.SUM.F.64.X 


Ensemble sum floating-point double exact 


E.SUM.F.64.Z 


Ensemble sum floating-point double zero 


E.SUM.F.128 


Ensemble sum floating-point quad 


E.SUM.F.128.C 


Ensemble sum floating-point quad ceiling 


E.SUM.F.128.F 


Ensemble sum floating-point quad floor 


E.SUM.F.128.N 


Ensemble sum floating-point quad nearest 


E.SUM.F.128.X 


Ensemble sum floating-point quad exact 


E.SUM.F.128.Z 


Ensemble sum floating-point quad zero 



Selection 





op 


prec 


round/trap \ 


copy 


COPY 


16 32 64 128 


NONE X 


absolute 
value 


ABS 


16 32 64 128 


NONE X j 


float from 
integer 


FLOAT 


16 32 64 128 


NONE C F N X Z 


integer 
from float 


SINK 


16 32 64 128 


NONE C F N X Z 
CD F.D Z.D 


increase 

format 

precision 


INFLATE 


16 32 64 


NONE X 


decrease 

format 

precision 


DEFLATE 


32 64 128 


noneCFNXZ. 


negate 


NEG 


16 32 64 128 


NONE X 


reciprocal 
estimate 


RECEST 


16 32 64 128 


NONE X 


reciprocal 
square root 
estimate 


RSQREST 


16 32 64 128 


NONE X 


square root 


SQR 


16 32 64 128 


NONE C F N X Z 


sum 


SUM 


16 32 64 128 


NONE C F N X Z 



Fig. 41 A (cont'd) 



Format 

E.op.prec.round rd=rc 
rd=eopprecround(rc) 

31 24 23 18 17 , 12 11 65 0 

| E.prec | rd | rc | op | E.UNARY | 

8 6 6 6 6 



Fig. 41 B 



Definition 

def EnsembleUnaryFloatingPointfop.prec.round.rd.rc) as 
c <- RegRead(rc, 128) 
case op of 

E.ABS.F, E.NEG.F, E.SQR.F: 
for i <r- 0 to 1 28-prec by prec 
ci<-F(prec,Cj +pr ec-1..i) 
case op of 
E.ABS.F: 

ai.t <- ci.t 
ai.s «- 0 
ai.e «- ci.e 
ai.f <- ci.f 
E.COPY.F: 
ai 4- ci 
E.NEG.F: 

ai.t <- ci.t 
ai.s «- ~ci.s 
ai.e «- ci.e 
ai.f <- ci.f 
E.RECEST.F: 

ai <- frecest(ci) 
E.RSQREST.F: 

ai <- frsqrest(ci) 
E.SQR.F: 

ai +- fsqr(ci) 

endcase 

ai+prec-1..i «- PackF(prec, ai, round) 
endfor 
E.SUM.F: 

p[0].t <- NULL 

for i <- 0 to 1 28-prec by prec 

p[i+prec] <- fadd(p[i], F(prec,Cj+p re c-i.. 
endfor 

a <- PackF(prec, p[128] f round) 
E.SINK.F: 

for i <— 0 to 1 28-prec by prec 

ci^Ffprec.Cj+prec-i.j) 

ai+prec-1..i <- fsinkr(prec, ci, round) 
endfor 
E.FLOAT.F: 

for i <- 0 to 1 28-prec by prec 

ci.t <- NORM 

ci.e <- 0 

ci.s <- q+prec-1 

ci.f 4- ci.s ? 1+~Cj+ P rec-2..i : Ci+ pre c-2..i 
ai+prec-1..i «- PackF(prec, ci, round) 
endfor 



Fig. 41 C 



E.INFLATE.F: 

for i <- 0 to 64-prec by prec 
ci<- F(prec,Ci +P rec.1..i) 

a M+prec+prec-l..i+i *- PackF(prec+prec, ci, round) 
endfor 
E.DEFLATE.F: 

for i <- 0 to 128-prec by prec 

ci^FtprecCj+prec.u) 

ai/2+prec/2-1..i/2 <- PackF(prec/2, ci, round) 
endfor 
ai27..64<-0 

endcase 

RegWrite[rd, 128, a] 
enddef 



Exceptions 

Floating-point arithmetic 



Fig. 41C (cont'd) 



E.MUL.G.8 


Ensemble multiply Galois field byte i 


E.MUL.G.64 


Ensemble multiply Galois field octlet | 



Fig. 42A 



Format 



E.MUL.G.size ra=rd,rc,rb 



ra=emulgsize(rd,rc,rb) 

31 24 23 18 17 12 11 6 5 0 

I E.MUL.G.size I rd | rc | rb I ra | 



Fig.42B 



Definition 

def c <- PolyMultiply(size,a,b) as 

p[ 0 ] <_ o 2 * size 

for k <- 0 to size-1 

p[k+1] <- p[k] A a k ? (0 slze - k || b || 0 k ) : 0 2#size 

endfor 

c <- p[size] 
enddef 

def c <- PolyResidue(size,a,b) as 
p[0] <- a 

for k <r- size-1 to 0 by -1 

p[k+1] +- p[k] * p[0] sl2e+ k ? (0 si2e - k || 1 1 || b || 0 k ) : 02*size 
endfor 

c<-p[size] s ize-1..0 
enddef 

def EnsembleTernary(op t size,rd,rc,rb,ra) as 
d <- RegRead(rd, 128) 
c <- RegRead(rc, 128) 
b <- RegRead(rb, 128) 
case op of 

E.MULG: 

for i <- 0 to 1 28-size by size 

asize-1+U<- Po!yResidue(sizePolyMul(size f Csjze-1+iJ»bsi ze -1+i.j).dsize-n 
endfor 

endcase 

RegWrite(ra f 128, a) 
enddef 



Exceptions 

none 



Fig. 42C 



2047 rd ( 1 2 8 ) 



127 




Ensemble multiply Galois field bytes 
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X.C0MPRESS.2 


Crossbar compress signed pecks 


X.C0MPRESS.4 


Crossbar compress signed nibbles 


X.C0MPRESS.8 


Crossbar compress signed bytes 


X.C0MPRESS.16 


Crossbar compress signed doublets 


X.COMPRESS.32 


Crossbar compress signed quadlets 


X.COMPRESS.64 


Crossbar compress signed octlets 


X.COMPRESS.128 


Crossbar compress signed hexlet 


X.C0MPRESS.U.2 


Crossbar compress unsigned pecks 


X.C0MPRESS.U.4 


Crossbar compress unsigned nibbles 


X.C0MPRESS.U.8 


Crossbar compress unsigned bytes 


X.C0MPRESS.U.16 


Crossbar compress unsigned doublets 


X.COMPRESS.U.32 


Crossbar compress unsigned quadlets j 


X.COMPRESS.U.64 


Crossbar compress unsigned octlets 


X.COMPRESS.U.128 


Crossbar compress unsigned hexlet 


X.EXPAND.2 


Crossbar expand signed pecks 


X.EXPAND.4 


Crossbar expand signed nibbles 


X.EXPAND.8 


Crossbar expand signed bytes 


X. EXPAND. 16 


Crossbar expand signed doublets 


X.EXPAND.32 


Crossbar expand signed quadlets 


X.EXPAND.64 


Crossbar expand signed octlets 


X. EXPAND. 128 


Crossbar expand signed hexlet j 


X.EXPAND.U.2 


Crossbar expand unsigned pecks [ 


X.EXPAND.U.4 


Crossbar expand unsigned nibbles 


X.EXPAND.U.8 


Crossbar expand unsigned bytes 


X.EXPAND.U.16 


Crossbar expand unsigned doublets 


X.EXPAND.U.32 


Crossbar expand unsigned quadlets 


X.EXPAND.U.64 


Crossbar expand unsigned octlets 


X.EXPAND.U.128 


Crossbar expand unsigned hexlet j 


X.R0TL.2 


Crossbar rotate left pecks 


X.R0TL.4 


Crossbar rotate left nibbles ( 


X.R0TL.8 


Crossbar rotate left bytes 


X.R0TL.16 


Crossbar rotate left doublets 


X.ROTL.32 


Crossbar rotate left quadlets 


X.ROTL.64 


Crossbar rotate left octlets 


X.ROTL128 


Crossbar rotate left hexlet 


X.R0TR.2 


Crossbar rotate right pecks 


X.R0TR.4 


Crossbar rotate right nibbles 1 


X.R0TR.8 | 


Crossbar rotate right bytes 


X.R0TR.16 


Crossbar rotate right doublets 



Fig. 43A 



a.KU 1 K.oZ 


crossbar rotate right quadlets 


Y DHTD C/1 

A.KU 1 K.04 


orossbar rotate right octlets 


Y DHTD A OQ 


urossbar rotate right hexlet 


Y CUI O 


orossbar shift left pecks 


Y CUI O 

A.onL.^.U 


Crossbar shift left signed pecks check overflow 


Y QUI A 


urossbar snitt left nibbles 


v cui a r\ 
A.OHL.4.U 


Crossbar shift left signed nibbles check overflow 


V CUI Q 

A.5HL.O 


Crossbar shift left bytes 


v cui 0 r\ 
A.SrlL.o.O 


Crossbar shift left signed bytes check overflow 


X.SHL.16 


Crossbar shift left doublets 


V O III A C /~\ 

X.SHL.16.0 


Crossbar shift left signed doublets check overflow 


V OLJI OO 

A.SHL.32 


Crossbar shift left quadlets 1 


V O 1 II A 

A.SHL.32.0 


Crossbar shift left signed quadlets check overflow 


V CUI CA 

A.SHL.64 


Crossbar shift left octlets 


V OLJI ca r\ 

A.SnL.64.0 


Crossbar shift left signed octlets check overflow 


V CUI A OO 

A.5HL.12o 


Crossbar shift left hexlet 


v cut a 00 r\ 
A.orlL.12o.O 


Crossbar shift left signed hexlet check overflow 


A.bnL.U.2.0 


Crossbar shift left unsigned pecks check overflow 


V CUI 1 1 A t\ 

A.5HL.U.4.0 


Crossbar shift left unsigned nibbles check overflow 


V CUI I I O A 

A.orlL.U.o.O 


Crossbar shift left unsigned bytes check overflow 


V OLJI 1 1 A 0 r\ ~" 


Crossbar shift left unsigned doublets check overflow \ 


V CUI II OO /"\ 

A.5nL.U.32.u 


Crossbar shift left unsigned quadlets check overflow 


A.SHL.U.64.U 


Crossbar shift left unsigned octlets check overflow 


V OLJI 1 1 A OO f\ 

A.SHL.U.128.0 


Crossbar shift left unsigned hexlet check overflow 


V CUD O 
A.OHK.2 


Crossbar signed shift right pecks 


V CUD A 
A.OHK.4 


Crossbar signed shift right nibbles 


V CUD O 

A.0HK.0 


Crossbar signed shift right bytes 


V CUD A 

A.onK.16 


Crossbar signed shift right doublets 


V CUD OO i 

A.orlK.32 


Crossbar signed shift right quadlets | 


V CUD C A 


Crossbar signed shift right octlets 


V CUD -IOO 


Crossbar signed shift right hexlet 


V CUD 1 1 O 
A.OMK.U.2 


Crossbar shift nght unsigned pecks 


X.SHR U 4 


Crossbar ^hlft rinht uncinnorl nihhloc 


X.SHR.U.8 | 


Crossbar shift right unsigned bytes 


X.SHR.U.16 


Crossbar shift right unsigned doublets 


X.SHR.U.32 


Crossbar shift right unsigned quadlets 1 


X.SHR.U.64 


Crossbar shift right unsigned octlets 


X.SHR.U.128 


Crossbar shift right unsigned hexlet 



Fig. 43A (cont'd) 



Selection 



class 


op 


size 


precision 


EXPAND EXPAND.U 
COMPRESS 

COMPRESS. 

U 


2 4 8 16 32 64 128 


shift 


ROTR ROTL SHR SHL 
SHL.O SHLU.O 
SHR.U 


2 4 8 16 32 64 128 



Format 

X.op.size rcNrc.rb 
rd=xopsize(rc,rb) 

31 252423 18 17 12 11 6 5 21 0 

I XSHIFT ls| rd I rc | rb | op Tszl 

7 1 6 6 6 4 2 

Isize <- log(size) 
s <- Isize2 
sz<- Isize i.o 



Fig. 43B 



Definition 



def Crossbar(op,stze,rd,rc,rb) 
c <- RegRead(rc, 128) 
b <- RegRead(rb, 128) 
shift <- b and (size-1) 
case ops.,2 II 0 2 of 
X.COMPRESS: 
hsize +- size/2 

for i <r- 0 to 64-hsize by hsize 
if shift < hsize then 

a i+hsize-1..i «- Cj+j+shift+hsize-1..i+i+shift 

else 

aj+hsize-1 ..i «- <^+s&e?P II Ci+i+size-1 ..i+i +S hift 

endif 
endfor 
ai27..64<-0 
X.COMPRESS.U: 
hsize <- size/2 

for i <r- 0 to 64-hsize by hsize 
if shift < hsize then 

a i+hsize-1..i «- Cj+j+shift+hsize-1 ..i+i+shift 

else 

a| + hsize-1..i *- OShift-hsize || c W+size .i..w + shift 

endif 
endfor 
ai27..64«~0 
X. EXPAND: 

hsize <- size/2 

for i <- 0 to 64-hsize by hsize 
if shift < hsize then 

aw + size-1..W <- cftfegf || ^ h$iz ^j || 0*™ 

else 

ai+i+size-1..i+i <- c i+size-shift-1 ..i II ° shift 

endif 
endfor 
X.EXPAND.U: 

hsize <- size/2 

for i <- 0 to 64-hsize by hsize 
if shift < hsize then 

aw +S ize-1..M <- O h size-shift || c^;^ j || O^hift 

else 

ai+i+size-1..i+! «- Ci+size-shifM..i II ° sh[ft 

endif 
endfor 
X.ROTL: 

for i <- 0 to 128-size by size 

ai+size-1..i <- Ci+size-1 -shift. i II Cj+ S ize-1..i+size-1 -shift 
endfor 



Fig. 43C 



X.ROTR: 

for i <- 0 to 128-size by size 

ai+size-1 ..i <- Cj+ S hift-1 ..i II Ci+size-1 ..i+shift 
endfor 
X.SHL: 

for i <- 0 to 128-size by size 

aj+size-1..i <- Ci+size-1-shift..i II 0 shift 
endfor 
X.SHLO: 

for i +- 0 to 128-size by size 

if Cj+size-1 ..i+size-1-shift * ^+ h jlz€h1 -shift then 
raise FixedPointArithmetic 

endif 

ai+size-1. .i «- Ci +S ize-1-shift..ill 0 shift 
endfor 
X.SHLU.O: 

for i +- 0 to 128-size by size 

if q+size-1 ..i+size-shift * 0 shlft then 
raise FixedPointArithmetic 

endif 

ai+size-1. .i «- Ci+size-1-shrfull 0 shlft 
endfor 
X.SHR: 

for i <— 0 to 128-size by size 

ai+size-1 .J <- cf+^e-l II c i+size-1.. i+shift 
endfor 
X.SHR.U: 

for i +- 0 to 128-size by size 

ai+size-1 .J «- 0 shift || Cj+sfee-L. j+shift 
endfor 

endcase 

RegWrite(rd, 128, a) 
enddef 



Exceptions 

Fixed-point arithmetic 



Fig. 43C (cont'd) 



1 lli ill 1 


m i mm \ I l»« 1 1 






II 





Compress 32 bits to 16, with 4-bit right shift 



Fig. 43D 



Operation codes 



X SHL M 2 


f^rr^ccKar oh iff I oft morno norl^c 

uiuobudi oi ill i icii iTicrye pt?(Jr\o 


X SHL M 4 


f^rr^cchar chift loft morno nihhloo 
oiuooudi oiiiii ion niciyt? iiiuuico 


X SHL M 8 


f^rocchar oh iff I off mo mo h\/toe 

uiuoouai oiiiii mil incryt? uyieo 


X SHL M 16 


Prncchar oh iff (off mo mo Hoi i Kioto 
v/IUooUdl o I Ull loll lilciyt? UUUUIolo 


X SHI M 12 


Prncchar oh iff I off marna ni lorllafo 
UlUooUdl ol llll 1611 IllfcJiyt? QU0UI6IS 


X ^Hl M 64 
/\. o n l. . i vi . u*t 


Prncchor ohiff laft nrtarriA ^/^tl^to 

vvrubbudi on iii leu merge ociieis 


y qui y ioq 


urossDar snm len merge nexiei 


X.SHR.M.2 


Crossbar shift riaht merae Decks 


X.SHR.M.4 


Crossbar shift right merge nibbles 


X.SHR.M.8 


Crossbar shift right merge bytes 


X.SHR.M.16 


Crossbar shift right merge doublets 


X.SHR.M.32 


Crossbar shift right merge quadlets 


X.SHR.M.64 


Crossbar shift right merge octlets 


X.SHR.M.128 


Crossbar shift right merge hexlet 



Fig. 43E 



Format 



X.op.size rd@rc,rb 
rd=xopsize(rd,rc,rb) 

31 252423 18 17 12 11 65 21 0 

I XSHIFT |s| rd | rc | rb | op | sz | 

7 1 6 6 6 4 2 

Isize <r- log(size) 
s <- Isize2 
sz <r- lsizei..o 

Fig 43F 



Definition 

def Crossbarlnplace(op ( size,rd,rc,rb) as 
d <- RegRead(rd, 128) 
c <r- RegRead(rc, 128) 
b <- RegRead(rb, 128) 
shifts- band (size-1) 
for i «- 0 to 1 28-size by size 
case op of 

X.SHR.M: 

a i+size-1..i <- Ci+shift-1..i II dj+size-1..i+shift 
X.SHLM: 

ai+size-1..i <- d|+size-1-shifU II Cj +S hitt-1..i 

endfor 

RegWrite(rd, 128, a) 
enddef 

Exceptions 

none 



Fig 43G 



Operation codes 



X.COMPRESS.1.2 


Crossbar compress immediate signed pecks 


X.COMPRESS.1.4 


Crossbar compress immediate signed nibbles 


X.COMPRESS.1.8 


Crossbar compress immediate signed bytes 


X.COMPRESS.1.16 


Crossbar compress immediate signed doublets 


X.COMPRESS.I.32 


Crossbar compress immediate signed quadlets 


X.COMPRESS.I.64 


Crossbar compress immediate signed octlets 


X.COMPRESS.1.128 


Crossbar compress immediate signed hexlet 


X.COMPRESS.I.U.2 


Crossbar compress immediate unsigned pecks 


X.COMPRESS.I.U.4 


Crossbar compress immediate unsigned nibbles 


X.COMPRESS.I.U.8 


Crossbar compress immediate unsigned bytes 


X.COMPRESS.I.U.16 


Crossbar compress immediate unsigned doublets 


X.COMPRESS.I.U.32 


Crossbar compress immediate unsigned quadlets 


X.COMPRESS.I.U.64 


Crossbar compress immediate unsigned octlets 


X.COMPRESS.I.U.128 


Crossbar compress immediate unsigned hexlet 


X. EXPAND. 1. 2 


Crossbar expand immediate signed pecks 


X. EXPAND. 1. 4 


Crossbar expand immediate signed nibbles 


X.EXPAND.I.8 


Crossbar expand immediate signed bytes 


X.EXPAND.1.16 


Crossbar expand immediate signed doublets 


X. EXPAND. 1. 32 


Crossbar expand immediate signed quadlets 


X.EXPAND.I.64 


Crossbar expand immediate signed octlets 


X.EXPAND.1.128 


Crossbar expand immediate signed hexlet 


X.EXPAND.I.U.2 


Crossbar expand immediate unsigned pecks 


X.EXPAND.I.U.4 


Crossbar expand immediate unsigned nibbles 


X.EXPAND.I.U.8 


Crossbar expand immediate unsigned bytes 


X. EXPAND. I. U. 16 


Crossbar expand immediate unsigned doublets 


X.EXPAND.I.U.32 


Crossbar expand immediate unsigned quadlets 


X. EXPAND. I. U. 64 


Crossbar expand immediate unsigned octlets 


X.EXPAND.I.U.128 


Crossbar expand immediate unsigned hexlet 


X.ROTL.I.2 


Crossbar rotate left immediate pecks 


X.ROTL.I.4 


Crossbar rotate left immediate nibbles 


X.ROTL.I.8 


Crossbar rotate left immediate bytes 


X.ROTL.1.16 


Crossbar rotate left immediate doublets 


X.ROTL.I.32 


Crossbar rotate left immediate quadlets 


X.ROTL.I.64 


Crossbar rotate left immediate octlets 


X.ROTL.1.128 


Crossbar rotate left immediate hexlet 


X.ROTR.I.2 


Crossbar rotate right immediate pecks 


X.ROTR.I.4 


Crossbar rotate right immediate nibbles 


X.ROTR.I.8 


Crossbar rotate right immediate bytes 


X.ROTR.1.16 


Crossbar rotate right immediate doublets 


X.ROTR.I.32 


Crossbar rotate right immediate quadlets 


X.ROTR.I.64 


Crossbar rotate right immediate octlets 


X.ROTR.1.128 


Crossbar rotate right immediate hexlet 



Fig. 43H 



X.SHL.1.2 


Crossbar shift left immediate pecks 


\/ III 1 

X.SHL.1.2. 0 


Crossbar shift left immediate signed pecks check overflow 


V/ Ol II 1 A 

X.SHL.1.4 


Crossbar shift left immediate nibbles 


V/ Ol II 1 A y— v 

X.SHL.1.4. 0 


Crossbar shift left immediate signed nibbles check overflow 


W Al II 1 O 

X.SHL.1.8 


Crossbar shift left immediate bytes 


X.SHL.I.8.0 


Crossbar shift left immediate signed bytes check overflow 


X.SHL.1.16 


Crossbar shift left immediate doublets 


V/ f \ III 1 ^ /\ 

X.SHL.I.16.0 


Crossbar shift left immediate signed doublets check overflow 


X.SHL.I.32 


Crossbar shift left immediate quadlets 


\/ K\ 1 II I ^X 

X.SHL.I.32.0 


Crossbar shift left immediate signed quadlets check overflow 


X.SHL.1.64 


Crossbar shift left immediate octlets 


X.SHL.I.64.0 


Crossbar shift left immediate signed octlets check overflow f 


X.SHL.1.128 


Crossbar shift left immediate hexlet 


X.SHL.I.128.0 


Crossbar shift left immediate signed hexlet check overflow 


x y i ii iii a0^. 

X.SHLI.U.2.0 


Crossbar shift left immediate unsigned pecks check overflow 


X.SHL.I.U.4.0 


Crossbar shift left immediate unsigned nibbles check overflow 


X.SHL.I.U.8.0 


Crossbar shift left immediate unsigned bytes check overflow 


v y ^\ III iii j 

X.SHL.I.U.16.0 


Crossbar shift left immediate unsigned doublets check overflow 


X.SHL.I.U.32.0 


Crossbar shift left immediate unsigned quadlets check overflow 


V/ ^X III III ^* a 

X.SHL.I.U.64.0 


Crossbar shift left immediate unsigned octlets check overflow 


X.SHLI.U.128.0 


Crossbar shift left immediate unsigned hexlet check overflow j 


X.SHR.1.2 


Crossbar signed shift right immediate pecks 


X.SHR.1.4 


Crossbar signed shift right immediate nibbles 


X.SHR.1.8 


Crossbar signed shift right immediate bytes j 


XX ^X I 1 1 -4 *H 

X.SHR.1.16 


Crossbar signed shift right immediate doublets 


X.SHR.I.32 


Crossbar signed shift right immediate quadlets 


X/ ^X 1 I I A 

X.SHR.1.64 


Crossbar signed shift right immediate octlets 


X.SHR.1.128 


Crossbar signed shift right immediate hexlet 


X.SHR.I.U.2 


Crossbar shift right immediate unsigned pecks j 


X SHR I U 4 


uiuooudi oinii fiyiii ii in iicuicuc unsigneo niDDies 


X.SHR.I.U.8 


Crossbar shift right immediate unsigned bytes 


X.SHR.I.U.16 


Crossbar shift right immediate unsigned doublets 


X.SHR.I.U.32 


Crossbar shift right immediate unsigned quadlets 


X.SHR.I.U.64 


Crossbar shift right immediate unsigned octlets 


X.SHR.I.U.128 


Crossbar shift right immediate unsigned hexlet 



Fig. 43H (cont) 



Selection 



class 


op 


size 


nrpricinn 


vulVirrxLOO.I 

COMPRESS.I.U EXPAND.I 
EXPAND.I.U 


9 4 O 4(5 OO CA 100 
t 1 O ID OZ 0*1 \£.0 


shift 


ROTL.I ROTR.I 
SHLI SHLI.O 
SHLI.U.O 
SHR.I SHR.I.U 


2 4 8 16 32 64 128 


copy ! 


COPY 





Format 



X.op.size rd=rc,shift 
rd=xopsize(rc,shift) 

31 24 23 18 17 12 11 6 5 0 

I XSHIFTI I rd | rc | simm | op ~~| 

8 6 6 6 6 

t <- 256-2*size+shift 
opi..o<-t7..6 
simm <r- t5..o 



Fig. 43! 



Definition 

def CrossbarShortImmediate(op,rd,rc,simm) 
case (opi..o II simm) of 
0..127: 



size 


<— 


128 


128..191: 






size 


i— 


64 


192..223: 






size 


<— 


32 


224..239: 






size 


<- 


16 


240..247: 






size 


<— 


8 


248..251 : 






size 


<— 


4 


252..253: 






size 


<- 


2 


254..255: 







raise Reservedlnstruction 

endcase 

shift <r- (opo || simm) and (size-1) 
c <- RegRead(rc f 128) 
case (ops„2 II 0 2 ) of 
X.COMPRESS.I: 
hsize <- size/2 

for i <- 0 to 64-hsize by hsize 
if shift < hsize then 

ai+hsize-1..i <- c i+i+shift+hsize-1..i+i+shift 

else 

aj+hsize-1 J «- II Cj+j +S ize-1 ..i+i+shift 

end if 
endfor 
ai27..64<-0 
X.COMPRESS.LU: 
hsize <- size/2 

for i <- 0 to 64-hsize by hsize 
if shift < hsize then 

aj+hsize-1..i <~ Cj+j+ S hift+hsize-1..i+i+shift 

else 

ai+hsize-1..i «- 0 shift " hsize || c i+ i + size-1..W+shift 

endif 
endfor 
ai27..64«-0 



Fig. 43J 



X.EXPAND.I: 

hsize <- size/2 

for i <— 0 to 64-hsize by hsize 
if shift < hsize then 

aw +S ize.1..i + i «- c^|!f || c l+hsiz ^j || 0» h « 

else 

aj+i+size-U+i «- Ci+size-shift-1..i II ° shift 

end if 
endfor 
X.EXPAND.I.U: 
hsize <- size/2 

for i <- 0 to 64-hsize by hsize 
if shift < hsize then 

aw +S ize-1..M «- O h size-shift || c i+hsize . 1 j || oshift 

else 

3i+i+size-1..i+i «- Ci+size-shifM..i II ° shift 

endif 
endfor 
X.SHLI: 

for i <- 0 to 128-size by size 

ai+size-1..i «- Ci +S i Z e-i-shift.ill 0 shifl 
endfor 
X.SHLI.O: 

for i <r- 0 to 128-size by size 

if Cj+size-1 ..i+size-1 -shift * -shift then 

raise FixedPointArithmetic 

endif 

ai+size-1..i <- Cj +S ize-1-shifUll 0 sh[ft 
endfor 
X.SHLLU.O: 

for i <- 0 to 128-size by size 

if Cj+size-U+size-shift * 0 shlft then 
raise FixedPointArithmetic 

endif 

ai+size-1..i «- Cj+size-1-shift..ill 0 shift 
endfor 

Fig. 43J (cont) 



X.ROTR.I: 

for i <- 0 to 128-size by size 

a i+size-1 ..i «- C|+shift-1 ..i II Cj+ S jze-1 ..i+shift 
endfor 
X.SHR.I: 

for i <- 0 to 128-size by size 

a i+S rze-1 J «- cf+sL-1 II c i+size-1 ..i+shift 
endfor 
X.SHR.I.U: 

for i <- 0 to 128-size by size 

aj +S ize-1..i «- 0 shlft II c j+size . 1 J+Shift 
endfor 

endcase 

RegWrite(rd, 128, a) 
enddef 



Exceptions 

Fixed-point arithmetic 
Reserved Instruction 

Fig. 43J (cont) 



Operation codes 



V f>l II h A 1 O 

X.SHLM.1.2 


Crossbar shift left merge immediate pecks 


V 0 1 II K A 1 A 

X.SHL.M.1.4 


Crossbar shift left merge immediate nibbles 


X.SHL.M.I.o 


Crossbar shift left merge immediate bytes 


\S O 1 II ft M 1 A /*» 

X.SHLM.1.16 


Crossbar shift left merge immediate doublets 


a.SHL.M.1.32 


- — — I 1 • Jtl. 1 fl • 1 » ft ft ft . S 

Crossbar shift left merge immediate quadlets 


v/ f\ m | ft j t O >i 

X.SHLM.1.64 


_ _ | • _ • _aT» i ^ft • t • a ft a « 

Crossbar shift left merge immediate octlets 


X.SHLM. 1.128 


Crossbar shift left merge immediate hexlet » 


X SHR M I 2 


^luoouai oi mi nym iiiciyc irnrnsuiai© pecKS 


X.SHR.M.I.4 


Crossbar shift right merge immediate nibbles 


X.SHR.M.I.8 


Crossbar shift right merge immediate bytes j 


X.SHR.M.1.16 


Crossbar shift right merge immediate doublets 


X.SHR.M.I.32 


Crossbar shift right merge immediate quadlets 


X.SHR.M.I.64 


Crossbar shift right merge immediate octlets 


X.SHR.M.1.128 


Crossbar shift right merge immediate hexlet 



Fig 43K 



Format 



X.op.size rd@rc,shift 
rd=xopsize(rc,shift) 

31 24 23 18 17 12 11 65 0 

I XSHIFTI | rd | fc I simm | op | 

8 6 6 6 6 

t <- 256-2*size+shift 
OP1..0 *-t7„6 
simm <- 1 5 . 0 

Fig 43L 



Definition 

def CrossbarShortlmmediatelnplace(op t rd,rc ? simm) 
case (opi„o || simm) of 
0..127: 

size <- 128 
128..191: 

size <- 64 
192..223: 

size <r- 32 
224..239: 

size <- 16 
240..247: 

size <- 8 
248..251: 

size <- 4 
252..2S3: 

size <- 2 
254..2S5: 

raise Reserved Instnjction 

endcase 

shift <- (opo || simm) and (size-1) 
c <- RegRead(rc, 128) 
d <- RegRead(rd, 128) 
for i <r- 0 to 128-size by size 
case (OP5..2 II 0 2 ) of 
X.SHR.M.I: 

ai+size-1.j <- Cj+ S hift-1..i II di+size-1..i+shift 
X.SHLM.I: 

3i+size-1.j <- di+size-1-shifU II Ci+shift-1..i 

endcase 
endfor 

RegWrite(rd, 128, a) 
enddef 

Exceptions 

Reserved Instruction 

Fig 43M 



Format 



X. EXTRACT ra=rd,rc,rb 



ra=xextract(rd,rc,rb) 

31 24 23 18 17 12 11 65 

I QP I rd | rc | rb | ra 



8 



Fig. 44A 



Definition 



def CrossbarExtract(op,ra,rb,rc,rd) as 
d «- RegRead(rd, 128) 
c <- RegRead(rc, 128) 
b <- RegRead(rb, 128) 
case b^o of 



0..255: 




gsize 


<-128 


256..383: 




gsize 


<-64 


384.447: 




gsize 


<-32 


448..479: 




gsize 


<-16 


480..495: 




gsize 


<-8 


496..503: 




gsize 


<-4 


504..507: 




gsize 


<-2 


508..511: 




gsize 


«- 1 



endcase 
m <— b-|2 

as <- signed «- b-|4 
h <- (2-m)*gsize 

spos <- (be..o) and ((2-m)*gsize-1) 
dpos <- (0 || b23..ie) ana * (gsize-1) 
sfsize (0 || b3i 24) and (Qsize-1) 

tfsize <- (sfsize = 0) or ((sfeize+dpos) > gsize) ? gsize-dpos : sfsize 
fsize «- (tfsize + spos > h) ? h - spos : tfsize 
for i <- 0 to 128-gsize by gsize 
case op of 

X. EXTRACT: 
if m then 

P<-dgsize+M..i 

else 

P<-(d Hc)2*(gsize+iH..2*i 

endif 

endcase 

v4-(as&p M )||p 

w <- (as & vspos+fsize-l) 9512 ^ 12 ^ 1508 II vfsize-1+spos..spos II 0 d P° s 
if m then 

a size-1+Li «- Cgsize-l+Ldpos+fsize+i II w dpos+fsize-1..dpos II Cdpos-I+U 

else 

a size-1+Li<- w 

endif 

endfor 

RegWrite(ra, 128, a) 
enddef 



Exceptions 

none 



Fig. 44B 



< — foizc » < dpos 
Crossbar extract 

Fig. 44C 




Fig. 44D 



Operation codes 



E.MULX 


Ensemble multiply extract 


E. EXTRACT 


Ensemble extract j 


E.SCAL.ADD.X 


Ensemble scale add extract 



Fig. 44E 



Format 

E.op ra=rd,rc,rb 
ra=eop(rd,rc,rb) 

31 24 23 18 17 12 11 6 5 0 

I °P I rd | rc I rb | ra I 

8 6 6 6 6 



Fig. 44F 



def mul(size,h,vs,v t i,ws,w,j) as 

mul <- ((vs&v size .i + i) h - sjze || v si2e . 1+u ) * ((ws&w size .i + j) h - size || Wsfee-1+j.j) 
enddef 

def EnsembleExtract(op f ra,rb,rc,rd) as 
d «- RegRead(rd, 128) 
c <- RegRead(rc, 128) 
b <- RegRead(rb, 128) 
case b8 4 .o of 
0..255: 

sgsize <- 128 
256..383: 

sgsize <- 64 
384..447: 

sgsize <- 32 
448..479: 

sgsize <- 16 
480..495: 

sgsize <- 8 
496..503: 

sgsize <- 4 
504..507: 

sgsize <- 2 
508..511: 

sgsize <- 1 

endcase 
l<-bn 
m <— b-12 
n <- bi3 
signed <- bi4 
case op of 

E. EXTRACT: 

gsize <- sgsize 

h <r- (2-m)*gsize 

as «- signed 

spos <- (be„o) and ((2-m)*gsize-1 ) 
E.SCAL.ADD.X: 

if (sgsize < 8) then 

gsize <- 8 
elseif (sgsize*(n+1) > 32) then 
gsize <-32/(n+1) 

else 

gsize <- sgsize 

endif 

ds <- cs <- signed 

bs <- signed A m 

as <- signed or m or n 

h <- (2*gsize) + 1 + n 

spos <- (b8..o) and (2*gsize-1) 

Fig. 44G 



E.MUL.X: 

if (sgsize < 8) then 

gsize <- 8 
elseif (sgsize*(n+1 ) > 1 28) then 

gsize <- 128/(n+1) 

else 

gsize <- sgsize 

endif 

ds <- signed 

cs <- signed A m 

as <- signed or m or n 

h <- (2*gsize) + n 

spos <- (bs..o) and (2*gsize-1) 

endcase 

dpos <- (0 || b23..l6) and (gsize-1) 
r <- spos 

sfsize <- (0 || b3i..24) and (gsize-1) 

tfsize <- (sfsize = 0) or ((sfsize+dpos) > gsize) ? gsize-dpos : sfsize 
fsize <- (tfsize + spos > h) ? h - spos : tfsize 
if (&10..9 = Z) and not as then 
rnd <- F 

else 

rnd<-bio..9 

endif 

for i <- 0 to 128-gsize by gsize 
case op of 

E. EXTRACT: 
if m then 

P<-dgsize+i-1..i 

else 

p^(d||c)2*(g S ize+i)-1..2*i 

endif 
E.MUL.X: 
if n then 

if (i and gsize) = 0 then 

p <- muKgsize.h.ds.d.i.cs.cj) - mul(gsize l h,ds,d,i+size,cs,c t i+size) 

else 

p <- muKgsize.h^s.d.Us.cj+size) + muKgsize.h.ds.d.i.cs.cj+size) 

endif 

else 

p <- muKgsize^.ds.d.i.cs.ci) 

endif 

Fig. 44G (cont) 



E.SCALADD.X: 
if n then 

if (i and gsize) = 0 then 

p <- mu!(gsize f h l ds,d,i,b$,b,64+2*gsize) 
+ muKgsize.h.cs.cJ.bs.b.M) 

- mul(gsize t h 1 ds,d,i+gsize,bs ? b,64+3*gsize) 

- mul(gsize f h,cs t c l i+gsize,bs f b f 64+gsize) 

else 

p <- muKgsize.h.ds.d.i.bs.b^+S'gsize) 
+ mul(gsize,h f cs t c f i,bs,b,64+gsize) 
+ mul(gsize f h,ds,d f i+gsize f bs,b f 64+2*gsize) 
+ mul(gsize f h f cs f c,i+gsize,bs,b f 64) 

endif 

else 

p <r- mul(gsize,h f ds,d ( i,bs t b,64+gsize) + mul(gsize l h f cs l c > i,bs,b,64) 

endif 

endcase 
case rnd of 
N: 

S<-0h-r||~p r ||pM 

Z: 

so-O^II p^ 

F: 

s<-0 h 

C: 

s 0 h " r || 1 r 

endcase 

v*-((as&p h . 1 )||p) + (0||s) 

'f (Vh..r+fsize = (as & v r+ f size -i) h+1 - r - fsi2 e) or not (I and (op = E. EXTRACT)) then 
w <- (as & v r+fsi2e -i)9size-fsize-dpos || Vfsize _ Ur j || O dpos 

else 

w <- (s ? (v h || - v fl size -dpos-1) • igsize-dpos) || O dpos 

endif 

if m and (op = E.EXTRACT) then 

a size-1+i..i «- Cgsize-1+i..dpos+fsize+i II w dpos+fsize-1..dpos II c<jpos-1+1..i 

else 

asize-1+i..i «- w 

endif 
endfor 

RegWrite(ra, 128, a) 
enddef 

Exceptions 

none 



Fig. 44G (cont) 



v r\c D/^o it o 
X.UtrUol 1 .Z 


Crossbar deposit signed pecks 


X.UtrUol I .4 


Crossbar deposit signed nibbles 


V RCDHOIT Q 

A.UtrUol 1 .o 


urossoar deposit signed Dytes 


A.UtrUol 1 .10 


urossoar deposit signed doublets 


A.UtrUol 1 .o^ 


urossDar deposit signed quadiets 


A.UtrUol 1 .04 


Crossbar deposit signed octlets 


A.UtrUol 1 . iZo 


Crossbar deposit signed hexlet 


v r\r~ nr\o it i i o 

X.UEPUSIT.U.2 


Crossbar deposit unsigned pecks 


X.DEPOSIT.U.4 


Crossbar deposit unsigned nibbles 


X.DEPOSIT.U.o 


Crossbar deposit unsigned bytes 


X.DEPOSIT.U.16 


— 1 _| • A. 9 ft 11. S 

Crossbar deposit unsigned doublets 


X.DEPOSIT.U.32 


Crossbar deposit unsigned quadiets 


X.DEPOSIT.U.64 


Crossbar deposit unsigned octlets 


X.DEPuSIT.U.128 


Crossbar deposit unsigned hexlet 


X.WITHDRAW.U.2 


Crossbar withdraw unsigned pecks 


V \A/ITUrVD A\ A/ 1 1 >t 

X.WITHDKAW.U.4 


Crossbar withdraw unsigned nibbles 


V lA/ITUHD A\A/ 1 1 O 

X.WI IHURAW.U.o 


Crossbar withdraw unsigned bytes 


v \A/iTunn A\A/ 1 1 A £2 

X.WITHUKAW.U.16 


Crossbar withdraw unsigned doublets 


V \A/ITLinDA\A/ 1 1 OO 1 

X.WITnDRAW.U.o2 


Crossbar withdraw unsigned quadiets 


v \A/iTunn A\A/ 1 1 £> A 

X.WITnDRAW.U.64 > 


Crossbar withdraw unsigned octlets 


V \A/ITUnD AlA/ 1 1 A OO 

X.WITHDRAW.U.128 \ 


Crossbar withdraw unsigned hexlet 


V \A/ITUr\D A\A/ O 

X.WITHDRAW.2 


Crossbar withdraw pecks 


X WITHDRAW A 


v^rooduar wunuraw niDDies 


X.WITHDRAW.8 


Crossbar withdraw bytes 


X.WITHDRAW.16 


Crossbar withdraw doublets 


X.WITHDRAW.32 


Crossbar withdraw quadiets 


X.WITHDRAW.64 


Crossbar withdraw octlets 


X.WITHDRAW. 1 28 


Crossbar withdraw hexlet 



Fig. 45A 



Equivalencies 



Y CCY / 9 


L/rossDar exxena immeaiate signea pecKs 


Y <2PY I A 

A.OCA./.'if 


orossuar exiena immeoiaie signeo niDDies 


Y cry / p 


orossuar exiena immeoiaie signeo oyies 


A..OEA>.l. 10 


urossuar exiena immeaiaie signeo oouoieis 


Y CCY / QO 


orossDar exiena immeaiate signeo quaoiets 


X.ofcX./. 04 


urossoar extend immediate signed octlets 


A.ofcX./. 72o 


Crossbar extend immediate signed hexlet 




frncchar OYtonH immoHiato uncinnoH norl^c 

uiuooudi cAici iu iiiiiiicrUiaio uiioiyneu peci\o 


X.ZEX.1.4 


Crossbar extend immediate unsigned nibbles 


X.ZEX.1.8 


Crossbar extend immediate unsigned bytes ] 


X.ZEXI.16 


Crossbar extend immediate unsigned doublets i 


X.ZEX.1.32 


Crossbar extend immediate unsigned quadlets 1 


X.ZEX.1.64 


Crossbar extend immediate unsigned octlets 


X.ZEXI.128 


Crossbar extend immediate unsigned hexlet 



X.SHLI.gsize rd=rc,i 


-» 


X.DEPOSIT.gsize rd=rc,size-i,i 


X.SHR.I.gsize rd=rc,i 


-> 


X.WITHDRAW.gsize rd=rc,size-i,i 


X.SHRU.I.gsize rd-rc.i 


-> 


X.WITHDRAW.U.gsize rd=rc,size-i,i 


X.SEX.I.gsize rd=rc,i 


-> 


X.DEPOSIT.gsize rd=rc,i,0 


X.ZEX.I.gsize rd=rc,i 


-> 


X.DEPOSIT.U.gsize rd=rc,i,0 


Redundancies 


X.DEPOSIT.gsize rd-rc,gsize,0 


o 


X.COPY rd=rc | 


X.DEPOSIT.U.gsize rd-rc,gsize,0 


o 


X.COPY rd=rc ! 


X.WITHDRAW.gsize rd=rc,gsize,0 


<=> 


X.COPY rd=rc 


X.WITHDRAW.U.gsize rd=rc,gsize,0 


o 


X.COPY rd=rc 



Fig. 45A (cont'd) 



Format 



X.op.gsize rd=rc,isize f ishift 
rd=xopgsize(rc,isize,ishift) 

31 26252423 18 17 1211 65 0 

I op I ih | rd 1 rc 1 gsfp | gsfs 1 

6 2 6 6 6 6 

assert isize+ishift < gsize 
assert isize>1 

iho || gsfs <- 128-gsize+isize-1 
ihi || gsfp <- 128-gsize+ishift 



Fig. 45B 



Definition 

def CrossbarField(op,rd,rc,gsfp,gsfs) as 
c <r- RegRead(rc, 128) 
case ((opi || gsfp) and (opo || gsfs)) of 
0..63: 

gsize <- 128 
64..9S: 

gsize <- 64 
96..111: 

gsize <- 32 
112..119: 

gsize <- 1 6 
120..123: 

gsize <- 8 
124..125: 

gsize <- 4 

126: 

gsize <- 2 

127: 

raise Reserved Instruction 

endcase 

ishift <- (opi || gsfp) and (gsize-1) 
isize <- ((opo || gsfs) and (gsize-1 ))+1 
if (ishift+isize>gsize) 

raise Reserved Instruction 

end if 

case op of 

X.DEPOSIT: 

for i <r- 0 to 128-gsize by gsize 

a j+ gsize.1..i <- II Cj + isize-1..i II 0 ishlft 

endfor 
X.DEPOSIT.U: 

for i <- 0 to 128-gsize by gsize 

ai +gS ize-1..i <- OSsize-isize-ishift || C j + j S lze-1 ..i II 0 ishlft 
endfor 
X.WITHDRAW: 

for i <- 0 to 128-gsize by gsize 

ai+gsize-1..i <- cp^f|£§5ihift-1 || Cj+j S ize+ishift-1 ..i+ishift 
endfor 
X.WITHDRAW.U: 

for i <- 0 to 128-gsize by gsize 

aj+gsize-1..i «- 09 size " isi2e || c l+ isi 2e +ishift-1..i+ishift 
endfor 

endcase 

RegWrite(rd, 128, a) 
enddef 

Exceptions 

Reserved instruction 

Fig. 45C 




encoding for crossbar field 
Fig. 45D 



< — fefze — ► 




< — fsiz e — >< dpo 



crossbar deposit 
Fig. 45E 



< — faize » 
crossbar withdraw 



Fig. 45F 



Operation c des 



X.DEPOSIT.M.2 


Crossbar deposit merge pecks 


X.DEPOSIT.M.4 


Crossbar deposit merge nibbles 


X.DEPOSIT.M.8 


Crossbar deposit merge bytes 


X.DEP0SIT.M.16 


Crossbar deposit merge doublets 


X.DEPOSIT.M.32 


Crossbar deposit merge quadlets 


X.DEPOSIT.M.64 


Crossbar deposit merge octlets 


X.DEPOSIT.M.128 


Crossbar deposit merge hexlet 



Fig 45G 



Format 



X.op.gsize rd@rc,isize,ishift 
rd=xopgsize(rd,rc,isize,ishift) 

31 26252423 18 17 1211 65 0 

I QP MM rd | rc | gsfp 1 gsfs | 

6 2 6 6 6 6 

assert isize+ishift < gsize 
assert isize>1 

iho || gsfs <- 128-gsize+isize-1 
ihi || gsfp <- 128-gsize+ishift 



Fig 45H 



Definition 

def CrossbarFieldlnplace(op,rd,rc,gsfp,gsfs) as 
c <- RegRead(rc, 128) 
d <- RegRead(rd, 128) 
case ((opi || gsfp) and (opo || gsfs)) of 
0..63: 

gsize <- 128 
64..9S: 

gsize *- 64 
96..111: 

gsize <- 32 
112..119: 

gsize <- 16 
120..123: 

gsize <- 8 
124..125: 

gsize <- 4 

126: 

gsize <- 2 

127: 

raise Reserved Instruction 

endcase 

ishift <~ (opi || gsfp) and (gsize-1 ) 
isize <- ((opo || gsfs) and (gsize-1 ))+1 
if (ishift+isize>gsize) 

raise Reserved Instruction 

end if 

for i <- 0 to 128-gsize by gsize 

aj+gsize-1.J «- dj+gsize-1 ..i+isize+ishift II Ci+i S ize-1..i II dj+ishift-1 
endfor 

RegWrite(rd, 128, a) 
enddef 

Exceptions 

Reserved instruction 

Fig 45! 



< — foizo — ► 




< — fsiz e — >< dpoa 
crossbar deposit merge 



Fig 45J 



X.SHUFFLE.4 


Crossbar shuffle within pecks 


V 0 1 1 1 ICCI d Q 

A.orlUrrLb.o 


Crossbar shuffle within bytes 


X.SHUFFLE.16 


Crossbar shuffle within doublets 


X.SHUFFLE.32 


Crossbar shuffle within quadlets 




X.SHUFFLE.64 


Crossbar shuffle within octlets 


XSHUFFLE.128 


Crossbar shuffle within hexlet 


X.SHUFFLE.256 


Crossbar shuffle within triclet 



Fig. 46A 



Format 



X.SHUFFLE.256 rd=rc,rb I v,w,h 
X.SHUFFLE.size rd=rcb,v,w 

rd=xshuffle256(rc,rb,v,w,h) 
rd=xshufflesize(rcb,v,w) 

31 24 23 18 17 12 11 6 5 0 

I X.SHUFFLE | rd | rc | rb | op j 

8 6 6 6 6 

rc <- rb <- rcb 
x<-log2(size) 
y*-log2(v) 
z<-log2(w) 

op <r- ((x*x*x-3*x*x-4*x)/6-(z*z-z)/2+x*z+y) + (size=256)*(h*32-56) 



Fig. 46B 



Definition 



def CrossbarShufflefmajor.rd.rc.rb.op) 
c <r- RegRead(rc t 128) 
b <- RegRead(rb, 128) 
if rc=rb then 
case op of 
0..55: 

for x <- 2 to 7; for y <- 0 to x-2; for z <- 1 to x-y-1 

if op = ((x*x*x-3*x*x-4*x)/6-(z*z-z)/2+x*z+y) then 
fori<-0to 127 

a " *~ C ('6..x II iy+z-1..y II «x-1..y+z II iy-1..o) 

end 

end if 

endfor; endfor; endfor 
S6..63: 

raise Reserved Instruction 

endcase 

elseif 

case op4„o of 
0..27: 

cb <r- c || b 
x <- 8 
h^-ops 

for y <- 0 to x-2; for z <- 1 to x-y-1 

^ OP4..0 = ((1 7*z-z*z)/2-8+y) then 
fori<-h*128to127+h*128 

aj-h*l28 *- cb^.y || j x -i..y + z || iy.L.0) 

end 

end if 
endfor; endfor 
28..31: 

raise Reservedlnstruction 

endcase 

end if 

RegWrite(rd, 128, a) 
enddef 



Exceptions 

Reserved Instruction 



Fig. 46C 



127 



rcb(128) 




127 



rd(128) 



4-way shuffle bytes within hexlet 



Fig. 46D 




- Egg ^ .~ » a isg ca sa ess 



127 rd(128) o 



4-way shuffle bytes within triclet 
Fig. 46E 



Format 



X.SWIZZLE rd=rc,icopy,iswap 
rd=xswizzle(rc,icopy,iswap) 

31 26 2524 23 18 17 12 11 6 5 0 

| X.SWIZZLE I ih I rd | rc | icopya | iswapa H 

6 2 6 6 6 6 

icopya 4- icopy5..o 
iswapa <- iswaps..o 
ih <- icopy 6 || iswap6 

Fig. 47A 



Definition 

def GroupSwizzlelmmediate(ih,rd,rc,icopya,iswapa) as 
icopy <- ihi || icopya 

iswap <- iho || iswapa 
c <r- RegRead(rc, 128) 
fori<-0to127 

3i C(j & icopy) A iswap 
endfor 

RegWrite(rd. 128, a) 
enddef 

Exceptions 

none 



Fig. 47B 




16-bit reverse 



Fig. 47C 



IX.SELECT.8 



Crossbar select bytes 



Format 



op ra=rd,rc,rb 
ra=op(rd,rc,rb) 

31 



24 23 



18 17 



12 11 



6 5 



rd 



rc 



rb 



ra 



6 

Fig. 47D 



Definition 

def CrossbarTernaryfop.rd.rc.rb.ra) as 
d «- RegRead(rd, 128) 
c <- RegRead(rc, 128) 
b <- RegRead(rb, 128) 
dc«-d||c 
fori<-0to 15 
j <- bs*i+4..8*i 

38*i+7..8 # i <- dC8*j+7..8*j 
endfor 

RegWrite(ra, 128, a) 
enddef 

Exceptions 

none 

Fig. 47E 



Pin summary 



A20M# 


I 


Address bit 20 Mask is an emulator signal. 


A31..A3 


10 


Address, in combination with byte enable, indicate the 
physical addresses of memory or device that is the target 
of a bus transaction. This signal is an output, when the 
processor is initiating the bus transaction, and an input 
when the processor is receiving an inquire transaction or 
snooping another processor's bus transaction. 


ADS# 


10 


ADdress Strobe, when asserted, indicates new bus 
transaction by the processor, with valid address and byte 
enable simultaneously driven. 


ADSC# 


0 


Address Strobe Copy is driven identically to address 
strobe 


AHOLD 


1 


Address HOLD, when asserted, causes the processor to 
cease driving address and address parity in the next bus 
clock cycle. 


AP 


10 


Address Parity contains even parity on the same cycle as 
address. Address parity is generated by the processor 
when address is an output, and is checked when address 
is an input. A parity error causes a bus error machine 
check. 


APCHK# 


0 


Address Parity CHecK is asserted two bus clocks after 
EADS# if address parity is not even parity of address. 


APICEN 


1 


Advanced Programmable Interrupt Controller ENable 

is not implemented. 


BE7#..BE0# 


10 


Byte Enable indicates which bytes are the subject of a 
read or write transaction and are driven on the same cycle 
as address. 


BF1..BF0 


1 


Bus Frequency is sampled to permit software to select 
the ratio of the processor clock to the bus clock. 


bUrrff 


1 

1 


BackOFF is sampled on the rising edge of each bus clock, 
and when asserted, the processor floats bus signals on the 
next bus clock and aborts the current bus cycle, until the 

hppkoff Qional ic camnloH nonotorl 
ua\*i\\JH oiLJtldl lo odllipiUU ilcyalcvJ. 


BP3..BP0 


0 


Breakpoint is an emulator signal. 


BRDY# 


1 


Bus ReaDY indicates that valid data is present on data on 
a read transaction, or that data has been accepted on a 
write transaction. 


BRDYC# 


1 


Bus ReaDY Copy is identical to BRDY#; asserting either 
signal has the same effect. 


BREQ 


0 


Bus REQuest indicates a processor initiated bus request. 



Fig. 48 



BUSCHK# 


1 


BUS CHecK is sampled on the rising edge of the bus 
clock, and when asserted, causes a bus error machine 
check. 


CACHE# 


0 


CACHE, when asserted, indicates a cacheable read 
transaction or a burst write transaction. 


CLK 


1 


bus CLocK provides the bus clock timing edge and the 
frequency reference for the processor clock. 


CPUTYP 


1 


CPU TYPe, if low indicates the primary processor, if high, 
the dual processor. 


D/C# 


1 


Data/Code is driven with the address signal to indicate 
data, code, or special cycles. 


D63..D0 


10 


Data communicates 64 bits of data per bus clock. 


D/P# 


0 


Dual/Primary is driven (asserted, low) with address on 
the primary processor 


DP7..DP0 


10 


Data Parity contains even parity on the same cycle as 
data. A parity error causes a bus error machine check. 


DPEN# 


10 


Dual Processing Enable is asserted (driven low) by a 
Dual processor at reset and sampled by a Primary 
processor at the falling edge of reset. 


EADS# 


1 


External Address Strobe indicates that an external 
device has driven address for an inquire cycle. 


EWBE# 


1 


External Write Buffer Empty indicates that the external 
system has no pending write. 


FERR# 


0 


Floating point ERRor is an emulator signal. 


FLUSH# 


1 


cache FLUSH is an emulator signal. 


FRCMC# 


1 


Functional Redundancy Checking Master/Checker is 

not implemented. 


HIT# 


10 


HIT indicates that an inquire cycle or cache snoop hits a 
valid line. 


HITM# 


10 


HIT to a Modfied line indicates that an inquire cycle or 
cache snoop hits a sub-block in the M cache state. 


HLDA 


o 


bus HoLD Acknowlege is asserted (driven high) to 
acknowlege a bus hold request 


HOLD 


1 


bus HOLD request causes the processor to float most of 
its pins and assert bus hold acknowlege after completing 
all outstanding bus transactions, or during reset. 


IERR# 


0 


Internal ERRor is an emulator signal. 


IGNNE# 


1 


IGNore Numeric Error is an emulator signal. 


INIT 


1 


INITializat.on is an emulator signal. 


INTR 


1 


maskable IN TeRrupt is an emulator signal. 


INV 


1 


INValidation controls whether to invalidate the addressed 
cache sub-block on an inqure transaction. 



Fig. 48 (c nt'd) 



KEN# 


I 


Cache ENable is driven with address to indicate that the 
read or write transaction is cacheable. 


LINT1..LINT0 


I , 


Local INTerrupt is not implemented. 


LOCK# 


0 


bus LOCK is driven starting with address and ending 
after bus ready to indicate a locked series of bus 
transactions. 


M/IO# 


O 


Memory/Input Output is driven with address to indicate a 
memory or I/O transaction. 


NA# 


I 


Next Address indicates that the external system will 
accept an address for a new bus cycle in two bus clocks. 


NMI 


I 


Non Maskable Interrupt is an emulator signal. 


PBGNT# 


IO 


Private Bus GraNT is driven between Primary and Dual 
processors to indicate that bus arbitration has completed, 
granting a new master access to the bus. 


PBREQ# 


IO 


Private Bus REQuest is driven between Primary and Dual 
processors to request a new master access to the bus. 


PCD 


0 


Page Cache Disable is driven with address to indicate a 
not cacheable transaction. 


PCHK# 


o 


Parity CHecK is asserted (driven low) two bus clocks after 
data appears with odd parity on enabled bytes. 


PHIT# 


IO 


Private HIT is driven between Primary and Dual 
processors to indicate that the current read or write 
transaction addresses a valid cache sub-block in the slave 
processor. 


PHITM# 


IO 


Private HIT Modified is driven between Primary and Dual 
processors to indicate that the current read or write 
transaction addresses a modified cache sub-block in the 
slave processor. 


PICCLK 


I 


Programmable Interrupt Controller CLocK is not 

implemented. 


PICD1..PICD 
0 


IO 


Programmable Interrupt Controller Data is not 

implemented. 


PEN# 


I 


Parity Enable, if active on the data cycle, allows a parity 
error to cause a bus error machine check. 


PM1..PM0 


O 


Performance Monitoring is an emulator signal. 


PRDY 


0 


Probe ReaDY is not implemented. 


PWT 


O 


Page Write Through is driven with address to indicate a 
not write allocate transaction. 


R/S# 


! 


Run/Stop is not implemented. ] 


RESET 


I 


RESET causes a processor reset. 


SCYC 


O 


Split CYCIe is asserted during bus lock to indicate that 
more than two transactions are in the series of bus 
transactions. 



Fig. 48 (cont'd) 



SMI# 


1 


System Management Interrupt is an emulator signal. 


SMIACT# 


0 


System Management Interrupt ACTIve is an emulator 
signal. 


STPCLK# 


1 


SToP CLocK is an emulator signal. 


TCK 


1 


Test CLocK follows IEEE 1149.1. 


TDI 


1 


Test Data Input follows IEEE 1149.1. 


TDO 


0 


Test Data Output follows IEEE 1 149.1 . 


TMS 


1 


Test Mode Select follows IEEE 1 149.1 . 


TRST# 


1 


Test ReSeT follows IEEE 1 149.1 . 


VCC2 


1 


VCC of 2.8V at 25 pins 


VCC3 


1 


VCC of 3.3V at 28 pins 


VCC2DET# 


0 


VCC2 DETect sets appropriate VCC2 voltaqe level. 


VSS 


1 


VSS supplied at 53 pins 


W/R# 


0 


Write/Read is driven with address to indicate write vs. 
read transaction. 


WB/WT# 


1 


Write Back/Write Through is returned to indicate that 
data is permitted to be cached as write back. 



Fig. 48 (cont'd) 



Electrical Specifications 



Clock rate 


66 MHz 


75 MHz 


100 MHz 


133 MHz 




Parameter 


min 


max 


min 


max 


min 


max 


min 


max 


• mil 

unii 


C*\ \C frpni ipnrv 

wLi\ IICLjutJNvy 


oo.o 


fiR 7 


^7 ^ 
Of .o 


7*^ 


^n 


I uu 




A 11 

loo 


K All 

MM 


CLK period 


15.0 


30.0 


13.3 


26.3 


10.0 


20.0 






ns 


CLK high time (>2v) 


4.0 




4.0 




3.0 








ns 


CLK low time (<0.8V) 


4.0 




4.0 




3.0 








ns 


CLK rise time (0.8V->2V) 


0.15 


1.5 


0.15 


1.5 


0.15 


1.5 






ns 


CLK fall time (2V->0.8V) 


0.15 


1.5 


0.15 


1.5 


0.15 


1.5 






ns 


CLK period stability 




250 




250 




250 






ps 



Fig. 49A 



mo i ..o vaiiu ueiay 


1 1 
i . i 


0.0 


A A 

1 .1 


4.0 


A A 


A A 

4.U 






ns 


A^l ^ float Holow 
MO I ..O HUal Ucldy 




in o 




7 0 
( .U 




7 A 
/ .U 






ns 


AHQif valid Holov/ 
ML/Ott VdllU UtJIdy 


1 o 


O.U 


1 0 
I .U 


*t.O 


A O 
i .U 


/i n 
4.U 






ns 


AH^# float Hplav 




in n 

I u.u 




7 0 




7 n 
f .u 






ns 


AnRH# valid Hplau 

AAL/Owtt VdllU Lit? Id y 


1 .u 


7 0 


1 0 


*t.O 


1 o 

I .u 


a n 

4.U 






ns 


AH^Pif float Holax/ 
nUOvvfr llUdl Ucldy 




10 0 
I u.u 




7 n 
/ .U 




7 n 
r .U 






ns 


AD x/aliH Holax/ 
nr VdllU Ucldy 


1 o 


ft *x 

o.o 


1 0 


^ R 

0.0 


1 o 

1 .u 


0.0 






ns 


A D flr\at rlalo\/ 
Mr TlOal delay 




ia a 
1U.U 




7 A 
f .U 




7 n 
7.0 






ns 


MrUrif\ff VallO ueiay 


4 a 
i .U 


Q O 

o.o 


i A 

I.U 


4.0 


4 o 

1.0 


4.5 






ns 


RP7 0£ waliH Holow 
DC f ..Urr VdllU ueiay 


1 o 

1 .u 


7 a 
f .U 


1 A 
1 .U 


4.0 


4 A 
1 .U 


A A 

4.U 






ns 


DC7 H# flr\ot HaIou 

c3t(..uff iioai QGiay 




4A a 
1U.U 




7 A 

1 .U 




7.0 






ns 


DDQ A woli/4 

□ro„u vana aeiav 


4 a 
1 .U 


1U.U 














ns 


dkcu vana ueiay 


a a 


o.U 


A A 
1 .U 


4.0 


4 A 
1.0 


>i 0 
4.0 






ns 


vvMuncff Vdiiu ueiay 


a a 
1 .U 


/ .U 


A A 
1 .U 


4.0 


4 A 
1.0 


A A 

4.0 






ns 


PAPWPif float Holax/ 
vvMvvnCff TlOdl U6ldy 




1U.U 




7 A 
/ .U 




7.0 






ns 


uiKstr Vaiiu ueiay 


a n 

1 .U 


7 n 
( .U 


A A 

I.U 


A C 

4.0 


4 A 
1.0 


A O 

4.0 






ns 


n/Pi£ float Holax/ 

uf\sfr nodi ueiay 




-in n 
1U.U 




7 A 
/ .U 




7.0 






ns 


l"^fi^ 0 tA/rito Hata \/aliH rlalov/ 

udo..u wine uaia vaiiu ueiay 


1 .0 


7 £ 


i o 

1 .o 


4.0 


4 O 
1.0 


4.5 






ns 


PiR*^ n iA/rito Hoto f\r\nt Halovi 

uoo.-u wriie uaia iioai aeiay 




1U.U 




"7 A 

7.0 




7.0 






ns 


ur/..u wriie aaxa vaiiu ueiay 


4 o 
1 .0 


7 C 

/.O 


1.0 


4.5 


1.3 


4.5 






ns 


PiPY n \A/rito Hoto float Holow 

urf ..u wriie uaia Tioax ueiay 




in a 
1U.U 




7 A 

(SJ 




7.0 






ns 


CCDDtf woliH Holow 

rtKKff vaiiu ueiay 


-i n 


O.O 


A A 
1.0 


A C 

4.5 


4 O 

1.0 


4.5 






ns 


WITif woliH Hoi aw 

ni i tt Vaiiu ueiay 


a n 

1 .U 


O.O 


4 A 

I.U 


A C 

4.0 


4 A 

1.0 


>i 0 
4.0 






ns 


MITMif waliH Holax/ 1 
ni 1 IVIrr VdllU Ueidy 


A A 

1 .1 


ft n 
o.U 


A A 1 
1.1 


A C 

4.0 


4 4 
1.1 


A A 

4.0 






ns 


nLUn vana aeiay 


4 n 
I.U 


O.O 


4 A 

1.0 


4.5 


4 O 

1.0 


4.0 




-■ ■ 


ns 


IPRPif waliH Holow 
iCixrxrr Vdli^UeidV 


1 .U 


O.O 














ns 


1 nPl^if x/aliH Holax/ 

Lv-/vvr\tr Vaiiu ueiay 


i 1 

i .1 


7 n 
/ .U 


4 A 
1.1 


4.0 


4 4 
1.1 


A A 

4.0 






ns 


1 OPKii float Holax/ 

Luui\tt nodi ueiay 
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Format 



op rd=rc,rb 
rd=op(rc,rb) 

31 24 23 18 17 12 11 6 5 0 

I L.MINOR | rd | rc | rb | op | 

8 6 6 6 6 
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Definition 



def Load(op,rd,rc,rb) as 
case op of 

L16L, L32L, L8, L16AL, L32AL. L16B, L32B, L16AB, L32AB. 
L64L, L64AL, L64B, L64AB: 
signed <- true 

LU16L, LU32L, LU8. LU16AL, LU32AL, LU16B, LU32B, LU16AB, LU32AB, 
LU64L, LU64AL, LU64B, LU64AB: 

signed false 
L128L, L128AL, L128B, L128AB: 

signed <- undefined 

endcase 
case op of 
L8.LU8: 

size <- 8 

L16L, LU16L, L16AL. LU16AL, L16B, LU16B, L16AB, LU16AB: 
size <- 16 

L32L, LU32L, L32AL, LU32AL, L32B, LU32B, L32AB, LU32AB: 
size <- 32 

L64L, LU64L. L64AL, LU64AL, L64B, LU64B, L64AB, LU64AB: 

size 64 
L128L, L128AL, L128B, L128AB: 

size<- 128 

endcase 

Isize <- log(size) 

case op of 

L16L, LU16L, L32L, LU32L, L64L, LU64L, L128L, 
L16AL, LU16AL, L32AL, LU32AL, L64AL, LU64AL, L128AL: 
order <- L 

L16B, LU16B. L32B, LU32B, L64B, LU64B, L128B, 

L16AB, LU16AB, L32AB, LU32AB, L64AB, LU64AB, L128AB: 

order <- B 
L8, LU8: 

order <- undefined 

endcase 
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c <- RegRead(rc, 64) 

b «- RegRead(rb, 64) 

VirtAddr <- c + (b 66 -| S ize..O II 0 lsize - 3 ) 

case op of 

L16AL, LU16AL, L32AL, LU32AL, L64AL, LU64AL, L128AL, 
L16AB, LU16AB, L32AB, LU32AB, L64AB, LU64AB, L128AB: 

if (C|size-4..0 * 0 th © n 

raise AccessDisallowedByVirtualAddress 

end if 

L16L, LU16L, L32L, LU32L, L64L, LU64L, L128L, 
L16B, LU16B, L32B, LU32B, L64B, LU64B, L128B: 
L8 f LU8: 
endcase 

m «- LoadMemory(c,VirtAddr,size,order) 
a <- (™size-1 an d signed) 1 28-size || m 
RegWrite(rd, 128, a) 
enddef 

Exceptions 

Access disallowed by virtual address 
Access disallowed by tag 
Access disallowed by global TB 
Access disallowed by local TB 
Access detail required by tag 
Access detail required by local TB 
Access detail required by global TB 
Local TB miss 
Global TB miss 

Fig. 50C (cont) 



Operation cod s 
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Load immediate signed byte 
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Load immediate signed doublet aligned big-endian 
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L.I.16.A.L 


Load immediate signed doublet aligned little-endian 
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Format 



op rd=rc,offset 
rd=op(rc,offset) 
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op | rd | rc | offset I 
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Definition 



def Loadlmmediate(op,rd,rc,offset) as 
case op of 

LI16L, LI32L, LI8, LI16AL, LI32AL, LI16B, LI32B, LI16AB, LI32AB: 
LI64L, LI64AL, LI64B, LI64AB: 

signed <- true 
LIU16L. LIU32L, LIU8, LIU16AL, LIU32AL, . 
LIU16B, LIU32B, LIU16AB, LIU32AB: 
LIU64L, LIU64AL, LIU64B, LIU64AB: 

signed <- false 
LI128L, LI128AL, LI128B, LI128AB: 

signed <- undefined 

endcase 
case op of 

LI8, LIU8: 
size <- 8 

LI16L. LIU16L, LI16AL, LIU16AL, LI16B. LIU16B, LI16AB. LIU16AB 
size <- 16 

LI32L. LIU32L, LI32AL. LIU32AL, LI32B, LIU32B, LI32AB, LIU32AB 
size <- 32 

LI64L, LIU64L, LI64AL, LIU64AL, LI64B, LIU64B, LI64AB, LIU64AB 

size < 64 

LI128L, LI128AL, LI128B, LI128AB: 

size <- 128 

endcase 

Isize <~ log(size) 

case op of 

LI16L, LIU16L, LI32L, LIU32L, L164L, LIU64L, LI128L, 
LI16AL. LIU16AL, LI32AL, LIU32AL, LI64AL, LIU64AL, LI128AL: 
order LI 

LI16B, LIU16B, LI32B, LIU32B, LI64B, LIU64B, LI128B, 

LI16AB, LIU16AB, LI32AB, LIU32AB, LI64AB, LIU64AB, U128AB: 

order <- B 
LI8, LIU8: 

order <r- undefined 

endcase 
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c <- RegRead(rc, 64) 

VirtAddr <- c + (offsetf f- |slze || offset || 0 ,size - 3 ) 
case op of 

LI16AL, LIU16AL, LI32AL, LIU32AL, LI64AL, LIU64AL, LI128AL, 
LI16AB, LIU16AB, LI32AB, LIU32AB, LI64AB, LIU64AB, LI128AB: 
if (cisize-4..0 * 0 then 

raise AccessDisallowedByVirtualAddress 

end if 

LI16L, LIU16L, LI32L, LIU32L, LI64L, LIU64L, LI128L, 
LI16B, LIU16B, LI32B, LIU32B, LI64B, LIU64B, LI128B: 
LI8, LIU8: 
endcase 

m «- LoadMemory(c,VirtAddr,size,order) 
a «- (™size-1 and signed) 1 28 " size || m 
RegWrite(rd, 128, a) 
enddef 

Exceptions 

Access disallowed by virtual address 
Access disallowed by tag 
Access disallowed by global TB 
Access disallowed by local TB 
Access detail required by tag 
Access detail required by local TB 
Access detail required by global TB 
Local TB miss 
Global TB miss 

Fig. 51C(cont) 
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o ivji t? Ljuduid diiynt?u iiiut?-t?i luiai i 


S 64 R 


oiuic UL*llc?L Uiy-tJi lUlai 1 


S.64.A.B 


Store octlet aligned big-endian 


S.64.L 


Store octlet little-endian 


S.64.A.L 


Store octlet aligned little-endian 


S.128.B 


Store hexlet big-endian 


S.128.A.B 


Store hexlet aligned big-endian 


S.128.L 


Store hexlet little-endian 


S.128.A.L 


Store hexlet aligned little-endian 


S.MUX.64.A.B 


Store multiplex octlet aligned big-endian 


S.MUX.64.A.L 


Store multiplex octlet aligned little-endian 



Fig. 52A 
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Format 



op rd.rc.rb 
op(rd,rc,rb) 

31 24 23 18 17 12 11 65 0 

I sImINOR I rd I rc I rb I op I 

8 6 6 6 6 



Fig. 52B 



Definition 



def Store(op,rd,rc,rb) as 
case op of 
S8: 

size <r~ 8 
S16L.S16AL, S16B, S16AB: 

size 16 
S32L, S32AL, S32B, S32AB: 

size <- 32 
S64L, S64AL, S64B, S64AB, 
SMUX64AB, SMUX64AL: 

size <- 64 
S128L, S128AL, S128B, S128AB: 

size <- 128 

endcase 
Isize <- log(size) 
case op of 
S8: 

order <- undefined 
S16L, S32L, S64L, S128L, 
S16AL, S32AL, S64AL, S128AL, SMUX64ALI: 

order «- L 
S16B, S32B, S64B, S128B, 
S16AB, S32AB, S64AB, S128AB, SMUX64ABI: 

order <- B 

endcase 

c <r- RegRead(rc, 64) 

b <- RegRead(rb, 64) 

VirtAddr <- c + (b 6 6-lsize..O II 0 ,slze - 3 ) 

case op of 

S16AL, S32AL, S64AL, S128AL, 
S16AB, S32AB, S64AB, S128AB, 
SMUX64AB, SMUX64AL: 
if (C|size-4..0 ^ 0 ^en 

raise AccessDisallowedByVirtualAddress 

endif 

S16L,S32L,S64L,S128L, 
S16B.S32B, S64B, S128B: 
S8: 
endcase 



Fig. 52C 



d <- RegRead(rd, 128) 
case op of 
S8, 

S16L.S16AL.S16B, S16AB, 
S32L, S32AL, S32B, S32AB, 
S64L, S64AL, S64B, S64AB, 
S128L, S128AL, S128B, S128AB: 

StoreMemory(c t VirtAddr f size,order f d S i 2e -i..o) 
SMUX64AB, SMUX64AL: 

lock 

a <- LoadMemoryWfc.VirtAddr.size.order) 

m «- (di27..64 & d63..0) I (a & -d63..0) 
StoreMemory^.VirtAddr.size.ordenm) 
endlock 

endcase 
enddef 

Exceptions 

Access disallowed by virtual address 
Access disallowed by tag 
Access disallowed by global TB 
Access disallowed by local TB 
Access detail required by tag 
Access detail required by local TB 
Access detail required by global TB 
Local TB miss 
Global TB miss 

Fig. 52C (cont) 



Operation codes 



O 1 o 

5.1.8 


Store immediate byte 


S.I.16.A.D 


Store immediate double aligned big-endian 


S.I.16.B 


Store immediate. double big-endian 


S.I.16.A.L 


Store immediate double aligned little-endian 


S.I.16.L 


Store immediate double little-endian 


S.I.32.A.B 


Store immediate quadlet aligned big-endian 


S.I.32.B 


Store immediate quadlet big-endian 


S.I.32.A.L 


Store immediate quadlet aligned little-endian 


S.I. 32. L 


Store immediate quadlet little-endian 


S.I.64.A.B 


Store immediate octlet aligned big-endian 


O.I.04.D 


oiore immeaiate ocxiet Dig-enaian 


S.I.64.A.L 


Store immediate octlet aligned little-endian 


S.I.64.L 


Store immediate octlet little-endian 


S.I.128.A.B 


Store immediate hexlet aligned big-endian 


S.I.128.B 


Store immediate hexlet big-endian 


S.I.128.A.L 


Store immediate hexlet aligned little-endian 


S.I.128.L 


Store immediate hexlet little-endian 


S.MUXI.64.A.B 


Store multiplex immediate octlet aligned big-endian 


S.MUXI.64.A.L 


Store multiplex immediate octlet aligned little-endian 



Fig. 53A 
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L B 


integer aligned 




16 32 64 128 


A 


L B 


multiplex 


MUX 


64 


A 


L B 



Format 



S.op.l.size.align.order rd.rc.offset 
sopisizealignorder(rd,rc,offset) 

31 24 23 18 17 12 11 0 

I op | rd | rc | offset 

8 6 6 12 

Fig. 53B 



Definition 



def Storelmmediate(op,rd,rc,offset) as 
case op of 
SI8: 

size <r- 8 
SI16L, SI16AL, SI16B, SI16AB: 

size <- 16 
SI32L, SI32AL, SI32B, SI32AB: 

size <r- 32 

SI64L, SI64AL, SI64B, SI64AB, SMUXI64AB, SMUXI64AL: 

size «- 64 
SI128L, SI128AL, SI128B, SI128AB: 

size <r- 128 

endcase 
Isize <- log(size) 
case op of 
SI8: 

order <- undefined 
SI16L, SI32L, SI64L, SI128L, 
SI16AL, SI32AL, SI64AL, SI128AL, SMUXI64AL: 

order <- L 
SI16B, SI32B, SI64B, SI128B, 
SI16AB, SI32AB, SI64AB, SI128AB, SMUXI64AB: 

order «- B 

endcase 

c <- RegRead(rc, 64) 

VirtAddr <- c + (offset?f- ,size || offset || 0 ,size - 3 ) 

case op of 

SI16AL, SI32AL, SI64AL, SI128AL, 
SI16AB, SI32AB, SI64AB, SI128AB, 
SMUXI64AB, SMUXI64AL: 
if ( c lsize-4..0 * 0 then 

raise AccessDisallowedByVirtualAddress 

end if 

SI16L, SI32L, S164L, SI128L, 
SI16B, SI32B, SI64B, SI128B: 
SI8: 
endcase 



Fig. 53C 



d <- RegRead(rd, 128) 
case op of 
SI8, 

SI16L, SI16AL, SI16B, SI16AB, 
SI32L, SI32AL, SI32B, SI32AB, 
SI64L, SI64AL, SI64B, SI64AB, 
SI128L, SI128AL, SI128B, SI128AB: 

StoreMemory(c,VirtAddr t size f order f d s j 2 e-i..o) 
SMUXI64AB, SMUXI64AL: 

lock 

a <- LoadMemoryWfc.VirtAddr.size.order) 

m <- (di27..64 & d63..0) I (a & -d 6 3..o) 
StoreMemoryfc.VirtAddr.size.order.m) 
endlock 

endcase 
enddef 

Exceptions 

Access disallowed by virtual address 
Access disallowed by tag 
Access disallowed by global TB 
Access disallowed by local TB 
Access detail required by tag 
Access detail required by local TB 
Access detail required by global TB 
Local TB miss 
Global TB miss 

Fig. 53C (cont) 
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